In [20]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import networkx as nx
import brewer2mpl
import math
from datetime import datetime
from Bio import AlignIO, SeqIO
from Bio.SeqRecord import SeqRecord
from Bio.Align.Applications import ClustalOmegaCommandline
from __future__ import division
from Bio.Seq import Seq
from collections import Counter
from sdi import sdi
from copy import deepcopy
from random import shuffle
from scipy.stats.mstats import mquantiles
from sklearn.ensemble import RandomForestClassifier
from sklearn.preprocessing import LabelEncoder
%matplotlib inline
Truc has the dataset in one massive spreadsheet right now. I am going to filter out:
Also, I will have to check that the accessions are "complete CDS" and not "partial CDS" - this is proxied by filtering on the "trimmed sequences" column such that anything that doesn't start with an "ATG" and have a CDS that is > 500 a.a. is filtered out.
In [2]:
data = pd.read_csv('H9_HA_dataset.csv', index_col='Accession ')
data = data[data['Trimmed Sequence*'].str[0:3] == 'ATG']
data['Trimmed Sequence*'] = data['Trimmed Sequence*'].str.replace('~', '')
data['Trimmed Sequence*'] = data['Trimmed Sequence*'].str.replace('-', '')
data['Sequence Length'] = data['Trimmed Sequence*'].str.len()
data = data[data['HostType_Code1'] != 'Avian (unidentified)'] # filter out unidentified
data['Geo_Code'] = data['Geo_Code'].str.replace('_', '.')
plt.hist(data['Sequence Length'].values, bins=100)
plt.show()
data = data[data['Sequence Length'] > 1600] # filter out non-full length
data
Out[2]:
Host
Species
HostCategory_Islam
HostTaxa_Nic
HostType_Nic
HostType_Code1
HostType_Code1S
HostType_Code2
HostOrder_Nic
Geo_Code
...
Date_Est
Gene segment
Taxa label
Trimmed Sequence*
Unnamed: 22
Unnamed: 23
Unnamed: 24
Unnamed: 25
Unnamed: 26
Sequence Length
Accession
CY031275
Avian
duck-quail adapted
?
Poultry
Domestic animal
Domestic
D
Quail
Galliformes
China.Central
...
1979-06-15
>4
A/duck/Hong Kong/702/1979-quail adapted
ATGGAAACAAAAGCACTAATAGCTATACTGTTAATGGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1709
KF188339
Avian
goose
Anseriformes
Anseriformes
Wild bird
Wild
W
Anseriformes
Anseriformes
N.Amer
...
1980-06-15
>4
A/goose/Minnesota/5733-1243/1980
ATGGAAACAACAACACTAATAGCTATACTGCTAATGGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1683
KF188287
Avian
turkey
Poultry
Poultry
Domestic animal
Domestic
D
Turkey
Galliformes
Europe
...
1983-06-15
>4
A/turkey/Pavia/141/1983
ATGGAGACAATAGCACCAATAGCTATACTGTTAATGGTAACAGCAG...
NaN
NaN
NaN
NaN
NaN
1683
CY005919
Avian
mallard
Anseriformes
Anseriformes
Wild bird
Wild
W
Anseriformes
Anseriformes
N.Amer
...
1983-08-07
>4
A/mallard duck/ALB/396/1983
ATGGAAATAACAACACTAATAGCTATACTGCTAATGGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1709
CY101406
Avian
ruddy turnstone
Charadriiformes
Charadriiformes
Wild bird
Wild
W
Charadriiformes
Charadriiformes
N.Amer
...
1987-05-19
>4
A/ruddy turnstone/Delaware Bay/2795/1987
ATGGAAATAACAACACTAGTAGCTATACTGCTAATGGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1696
CY005986
Avian
laughing gull
Charadriiformes
Charadriiformes
Wild bird
Wild
W
Charadriiformes
Charadriiformes
N.Amer
...
1987-06-09
>4
A/laughing gull/Delaware Bay/2718/1987
ATGGAAATAACAACACTAGTAGCTATACTGCTAATGGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1709
CY101507
Avian
ruddy turnstone
Charadriiformes
Charadriiformes
Wild bird
Wild
W
Charadriiformes
Charadriiformes
N.Amer
...
1988-05-28
>4
A/ruddy turnstone/Virginia/2297/1988
ATGGAAATAACAACACTAGTAGCTATACTGATAATGGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1696
AB303077
Avian
mallard
Anseriformes
Anseriformes
Wild bird
Wild
W
Anseriformes
Anseriformes
Europe
...
1993-06-15
>4
A/mallard/Ireland/PV46B/1993
ATGGAAATAACAGCATTAATAGCTATACTGTTAGTGACAACAACAA...
NaN
NaN
NaN
NaN
NaN
1690
AF156379
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
1994-06-15
>4
A/Chicken/Hong Kong/739/94
ATGGAAACAATATCACTAATAACTATACTACTAGTAATAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1671
HE802066
Avian
duck
?
Duck (unidentified)
Wild bird
Wild
W
Anseriformes
Anseriformes
Europe
...
1995-06-15
>4
A/duck/Germany/113/1995
ATGGAAATAATAGCACTAATAGCTATACTGTTAGTGACAACAACAA...
NaN
NaN
NaN
NaN
NaN
1709
JX273569
Avian
turkey
Poultry
Poultry
Domestic animal
Domestic
D
Turkey
Galliformes
Europe
...
1995-06-15
>4
A/turkey/Germany/EK224/1995
ATGGAAATAATAGCATTAATAGCTATACTGTTAGTGACAACAACAA...
NaN
NaN
NaN
NaN
NaN
1709
CY102188
Avian
shorebird
Charadriiformes
Charadriiformes
Wild bird
Wild
W
Charadriiformes
Charadriiformes
N.Amer
...
1996-05-14
>4
A/shorebird/Delaware Bay/31/1996
ATGGAAACCAGAACACTAATAGCTGCGCTTCTGATTGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1683
DQ064377
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1996-06-15
>4
A/chicken/Shandong/7/96
ATGGAAACAACATCACTAATAACTATACTACTACTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1709
GU053186
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1996-06-15
>4
A/chicken/Korea/MS96-CE6/1996
ATGGAAATAATAGCACTAATAGCTATACTGGTAGTGACAAAAACAA...
NaN
NaN
NaN
NaN
NaN
1696
AB049159
Avian
parakeet
Passeriformes?
Psittaciformes
Captive wild
Wild
W
Other
NaN
E.Asia.E.China
...
1997-06-15
>4
A/parakeet/Chiba/1/97
ATGGAAACAATATCACTACTAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1683
AB432938
Avian
duck
Poultry
Poultry
Domestic animal
Domestic
D
DomDuckGeese
Anseriformes
China.Central
...
1997-06-15
>4
A/duck/Hong Kong/W213/1997
ATGGAAGCAGTATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1683
DQ064360
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
1997-06-15
>4
A/chicken/Guangdong/5/97
ATGGAAGCAGTATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1709
JQ344328
Avian
duck
?
Poultry
Domestic animal
Domestic
D
DomDuckGeese
Anseriformes
SE.Asia
...
1997-09-24
>4
A/duck/Malaysia/91/1997
ATGGAAGCAACAGCAATAATAACCATACTATTAGTAATAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1709
KF800947
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
1998-02-02
>4
A/chicken/Iran/av1221/1998
ATGGAACAGGTATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1683
AB049160
Avian
parakeet
Passeriformes?
Psittaciformes
Captive wild
Wild
W
Other
NaN
E.Asia.E.China
...
1998-06-15
>4
A/parakeet/Narita/92A/98
ATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1683
AF461510
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1998-06-15
>4
A/Chicken/Jiangsu/2/98
ATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1683
AY743216
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1998-06-15
>4
A/Chicken/Shanghai/F/98
ATGGAAACAATATCACTAATAGCTATACTACTAGTAGTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1709
CY081264
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
1998-06-15
>4
A/chicken/Saudi Arabia/CP7/1998
ATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1680
FJ794817
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
1998-06-15
>4
A/chicken/Iran/SS1/1998
ATGGAAACAGTATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1709
JQ419725
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
1998-06-15
>4
A/chicken/Iran/725/1998
ATGGAAACAACATCACTGTTAACTATACTACTAGTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1677
GQ497118
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
1998-10-26
>4
A/chicken/Iran/661/1998
ATGGAACAGGTATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1677
AF461512
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
1999-06-15
>4
A/Chicken/Gansu/1/99
ATGGAAACAATATCACTAATAACTATACTACTAATAGTAACAGCAG...
NaN
NaN
NaN
NaN
NaN
1683
AF461528
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
1999-06-15
>4
A/Chicken/Yunnan/1/99
ATGGAAACAATATCACTAATAACTATAATACTAGTAGTAACGGTAA...
NaN
NaN
NaN
NaN
NaN
1683
AF508556
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
S.Asia
...
1999-06-15
>4
A/chicken/Pakistan/5/99
ATGGAAACAAGATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1648
AF508568
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
1999-06-15
>4
A/Chicken/Ningxia/5/99
ATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1634
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
JN804540
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2011-07-15
>4
A/chicken/Shanxi/43/2011
ATGGAGACAGTATCACTAATAACTATACTACTAGTAGTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804542
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
2011-07-15
>4
A/chicken/Chongqing/K7/2011
ATGGAGACAGCATCACTAATAACTATGCTACTAGTAGCAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804543
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
2011-07-15
>4
A/chicken/Chongqing/K16/2011
ATGGAGACAGTATCTCTAATAACTATACTACTAGTATTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804544
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
2011-07-15
>4
A/chicken/Chongqing/K3/2011
ATGGAGACAGTATCTCTAATAACTATACTACTAGTATTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804545
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.West
...
2011-07-15
>4
A/chicken/Chongqing/A56/2011
ATGGAGACAGTATCTCTAATAACTATACTACTAGTATTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804547
Avian
duck
Poultry
Poultry
Domestic animal
Domestic
D
DomDuckGeese
Anseriformes
China.West
...
2011-07-15
>4
A/duck/Chongqing/B36/2011
ATGGAGACAGTATCTCTAATAACTATACTACTAGTATTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1675
JN804557
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2011-07-15
>4
A/chicken/Guangdong/286/2011
ATGGAAGCAGCAACAATAATAACTATACTACTAGCAATAACAGGAA...
NaN
NaN
NaN
NaN
NaN
1675
JQ906555
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2011-10-15
>4
A/chicken/Egypt/115636V/2011
ATGGAAATAACACCACTGATGACTATACTACTATTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1683
KC162234
Avian
baikal teal
Anseriformes
Anseriformes
Wild bird
Wild
W
Anseriformes
Anseriformes
E.Asia.E.China
...
2011-10-15
>4
A/baikal teal/Xianghai/421/2011
ATGGAAATAATAGCACTAATAGCTATACTATTAGTAACAACAACGA...
NaN
NaN
NaN
NaN
NaN
1683
CY110927
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2011-12-15
>4
A/chicken/Egypt/S4454E/2011
ATGGAAATAATACCACTGACGACTATACTACTATTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1685
CY110928
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2011-12-15
>4
A/chicken/Egypt/S4456B/2011
ATGGAAATAATACCACTGACGACTATACTACTATTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1683
JQ770133
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2011-12-15
>4
A/chicken/Guangdong/LJT12/2011
ATGGAAGTAGTATCACTAATAACTATACTACTAGTAATAACAGGAA...
NaN
NaN
NaN
NaN
NaN
1683
JQ973658
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2011-12-15
>4
A/chicken/Israel/1115/2011
ATGGAAATAATATCACTGATGACTATACTACTGGTGGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
JQ973660
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2011-12-15
>4
A/chicken/Israel/1164/2011
ATGGAAATAACATCACTGATGACTATACTACTAGTAATAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
JQ973652
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2012-01-15
>4
A/chicken/Israel/11/2012
ATGGAAACAATATCACTGATGACTATACTACTGGTGGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
JQ973653
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2012-01-15
>4
A/chicken/Israel/46/2012
ATGGAACCAATATCACTGATGACTATACTACTGGTGGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
JQ973654
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2012-01-15
>4
A/chicken/Israel/50/2012
ATGGAAATAATATCACTGATGACTGTACTACTAGTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
KC417046
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
2012-01-15
>4
A/chicken/Shanghai/C1/2012
ATGGAAGTAGTATCACTAATAACTATACTACTAGTAGCAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1683
JQ906557
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2012-02-15
>4
A/chicken/Egypt/1226B/2012
ATGGAAATAATACCACTGACGACTATACTACTATTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1652
JQ906558
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2012-02-15
>4
A/chicken/Egypt/1231B/2012
ATGGAAATAATACCACTGATGACTGTACTGCTATTAGTAACATCAA...
NaN
NaN
NaN
NaN
NaN
1652
KC817014
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2012-02-15
>4
A/chicken/Henan/ZK2/2012
ATGGAGACAGCATCGCTGATGACTATACTACTAGTAGTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1683
JX448765
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
2012-03-15
>4
A/chicken/Fujian/SN2/2012
ATGGAAGTAGTATCACTGATAACTACACTGTTAGCAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1683
JX846585
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2012-06-15
>4
A/chicken/Henan/YX/2012
ATGGAAGTAGTATCACTAATAACTATACTACTAGTAGTAACAGTAT...
NaN
NaN
NaN
NaN
NaN
1683
KC951122
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
China.Central
...
2013-01-15
>4
A/chicken/Guangdong/LG1/2013
ATGGAGACAGTATCACTAATAACTATACTACTAGTAGCAACAATAA...
NaN
NaN
NaN
NaN
NaN
1683
KF918709
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2013-01-15
>4
A/chicken/Israel/74/2013
ATGGAAATAATATCACTGATGACTGTACTACTAGTAGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
KF918708
Avian
chicken
Poultry
Poultry
Domestic animal
Domestic
D
Chicken
Galliformes
Middle.East
...
2013-04-15
>4
A/chicken/Israel/502/2013
ATGGAAGCAATATCACTGATGACTATACTACTGGTGGTAACAACAA...
NaN
NaN
NaN
NaN
NaN
1680
KJ128362
Avian
pigeon
?
Columbiformes
Wild bird
Wild
W
Other
NaN
E.Asia.E.China
...
2013-04-15
>4
A/pigeon/Shanghai/JC1/2013
ATGGAAGTAGTATCACTAATAACTATACTACTAGTAGCAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1683
AF156378
Avian
?
Galliformes
quail
Domestic animal
Domestic
D
Quail
Galliformes
China.Central
...
1997-06-15
>4
A/Quail/Hong Kong/G1/97
ATGGAAACAATATCGCTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1629
AF156380
Avian
Poultry
Poultry
chicken
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1994-06-15
>4
A/chicken/Beijing/1/1994
ATGGAAACAATATCACTAATAACTATACTACTAGTAGTAACAGCAA...
NaN
NaN
NaN
NaN
NaN
1660
AF461532
Avian
Poultry
Poultry
chicken
Domestic animal
Domestic
D
Chicken
Galliformes
E.Asia.E.China
...
1998-06-15
>4
A/Chicken/Shanghai/F/98
ATGGAAACAATATCACTAATAGCTATACTACTAGTAGTAACAGTAA...
NaN
NaN
NaN
NaN
NaN
1683
638 rows × 27 columns
In [3]:
# From the data, pull out accession and sequence, and store as a list of SeqRecords.
sequences = []
for row in data.iterrows():
sequence = SeqRecord(Seq(row[1]['Trimmed Sequence*']),
id=row[0] + '_' + str(row[1]['HostType_Code1S']) + '_' + str(row[1]['Geo_Code']) + '_' + str(row[1]['HostOrder_Nic']))
sequences.append(sequence)
In [4]:
# sequences
In [5]:
# # Function to find longest ORFs:
# def longest_orfs(list_of_seqrecords):
# aa_sequences = []
# for i, record in enumerate(list_of_seqrecords):
# # print(i, record.seq)
# longest_protein = SeqRecord(id=record.id, seq='')
# for frame in range(3):
# length = 3 * ((len(record) - frame) // 3)
# translation = record.seq[frame:frame + length].translate()
# for pro in translation.split("*"):
# if len(pro) > len(longest_protein.seq):
# longest_protein.seq = pro
# aa_sequences.append(longest_protein)
# return aa_sequences
In [6]:
# # Uncomment this cell if you need to re-write them to disk.
# # Get the longest ORFs from the sequences
# ha_orfs = longest_orfs(sequences)
# # Write the longest ORFS to disk:
# SeqIO.write(ha_orfs, 'H9N2_HA_CDS_all.fasta', 'fasta')
In [7]:
# # Perform multiple sequence alignment using Clustal Omega.
# # Uncomment this cell only if you need to run another multiple sequence alignment.
# gene = 'HA'
# in_file = "H9N2_%s_CDS_all.fasta" % gene
# out_file = "H9N2_%s_CDS_all_Aligned.fasta" % gene
# cline = ClustalOmegaCommandline(infile=in_file, outfile=out_file, verbose=True, auto=True, force=True)
# cline()
In [8]:
# Read in the aligned sequences
gene = "HA"
genes = [s for s in AlignIO.read('H9N2_%s_CDS_all_Aligned.fasta' % gene, 'fasta') if 'nan' not in s.id]
genes
Out[8]:
[SeqRecord(seq=Seq('METKALIAILLMVTTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY031275_D_China.Central_Galliformes', name='CY031275_D_China.Central_Galliformes', description='CY031275_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTTLIAILLMVTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF188339_W_N.Amer_Anseriformes', name='KF188339_W_N.Amer_Anseriformes', description='KF188339_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIAPIAILLMVTAGNADKICIGHQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF188287_D_Europe_Galliformes', name='KF188287_D_Europe_Galliformes', description='KF188287_D_Europe_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY005919_W_N.Amer_Anseriformes', name='CY005919_W_N.Amer_Anseriformes', description='CY005919_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLVAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY101406_W_N.Amer_Charadriiformes', name='CY101406_W_N.Amer_Charadriiformes', description='CY101406_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLVAILLMVTASNADKICIGYQSTNSTETVDTLIESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY005986_W_N.Amer_Charadriiformes', name='CY005986_W_N.Amer_Charadriiformes', description='CY005986_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLVAILIMVTASNADKICIGYQSTNSTETVDTLIESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY101507_W_N.Amer_Charadriiformes', name='CY101507_W_N.Amer_Charadriiformes', description='CY101507_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AB303077_W_Europe_Anseriformes', name='AB303077_W_Europe_Anseriformes', description='AB303077_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVITASSADKICIGYQSTNSTETVDTLIESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AF156379_D_China.Central_Galliformes', name='AF156379_D_China.Central_Galliformes', description='AF156379_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HE802066_W_Europe_Anseriformes', name='HE802066_W_Europe_Anseriformes', description='HE802066_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273569_D_Europe_Galliformes', name='JX273569_D_Europe_Galliformes', description='JX273569_D_Europe_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METRTLIAALLIVTTSNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY102188_W_N.Amer_Charadriiformes', name='CY102188_W_N.Amer_Charadriiformes', description='CY102188_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLLVTTSNADKICIGYQSTNSTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064377_D_E.Asia.E.China_Galliformes', name='DQ064377_D_E.Asia.E.China_Galliformes', description='DQ064377_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVVTKTSNADKICIGYQSTNSTETVDTLVENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU053186_D_E.Asia.E.China_Galliformes', name='GU053186_D_E.Asia.E.China_Galliformes', description='GU053186_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTASNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB432938_D_China.Central_Anseriformes', name='AB432938_D_China.Central_Anseriformes', description='AB432938_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTASNADKICIGYQSTNSTETVGTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064360_D_China.Central_Galliformes', name='DQ064360_D_China.Central_Galliformes', description='DQ064360_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATAIITILLVITASYADKICIGYQSTNSTETVDTLTETNVPVTHTKDLLHTE...---', SingleLetterAlphabet()), id='JQ344328_D_SE.Asia_Anseriformes', name='JQ344328_D_SE.Asia_Anseriformes', description='JQ344328_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQVSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF800947_D_Middle.East_Galliformes', name='KF800947_D_Middle.East_Galliformes', description='KF800947_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHARELLHTE...---', SingleLetterAlphabet()), id='AF461510_D_E.Asia.E.China_Galliformes', name='AF461510_D_E.Asia.E.China_Galliformes', description='AF461510_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AY743216_D_E.Asia.E.China_Galliformes', name='AY743216_D_E.Asia.E.China_Galliformes', description='AY743216_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY081264_D_Middle.East_Galliformes', name='CY081264_D_Middle.East_Galliformes', description='CY081264_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ794817_D_Middle.East_Galliformes', name='FJ794817_D_Middle.East_Galliformes', description='FJ794817_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLLTILLVVTTSNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ419725_D_Middle.East_Galliformes', name='JQ419725_D_Middle.East_Galliformes', description='JQ419725_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQVSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497118_D_Middle.East_Galliformes', name='GQ497118_D_Middle.East_Galliformes', description='GQ497118_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLIVTAGNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461512_D_China.West_Galliformes', name='AF461512_D_China.West_Galliformes', description='AF461512_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITIILVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461528_D_China.West_Galliformes', name='AF461528_D_China.West_Galliformes', description='AF461528_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METRSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF508556_D_S.Asia_Galliformes', name='AF508556_D_S.Asia_Galliformes', description='AF508556_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF508568_D_China.West_Galliformes', name='AF508568_D_China.West_Galliformes', description='AF508568_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF508571_D_E.Asia.E.China_Galliformes', name='AF508571_D_E.Asia.E.China_Galliformes', description='AF508571_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METRSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AJ291392_D_S.Asia_Galliformes', name='AJ291392_D_S.Asia_Galliformes', description='AJ291392_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVLSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AY036880_D_China.Central_Galliformes', name='AY036880_D_China.Central_Galliformes', description='AY036880_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLMTILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064375_D_China.West_Galliformes', name='DQ064375_D_China.West_Galliformes', description='DQ064375_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ227352_D_China.West_Galliformes', name='DQ227352_D_China.West_Galliformes', description='DQ227352_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITIPLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF070733_D_China.West_Galliformes', name='EF070733_D_China.West_Galliformes', description='EF070733_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU053201_D_Middle.East_Galliformes', name='GU053201_D_Middle.East_Galliformes', description='GU053201_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METRSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188299_D_S.Asia_Galliformes', name='KF188299_D_S.Asia_Galliformes', description='KF188299_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497120_D_Middle.East_Galliformes', name='GQ497120_D_Middle.East_Galliformes', description='GQ497120_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGPYHTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497119_D_Middle.East_Galliformes', name='GQ497119_D_Middle.East_Galliformes', description='GQ497119_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY006021_W_E.Asia.E.China_Anseriformes', name='CY006021_W_E.Asia.E.China_Anseriformes', description='CY006021_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKFCIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ485208_D_China.Central_Galliformes', name='DQ485208_D_China.Central_Galliformes', description='DQ485208_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLVVTASNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY102633_W_N.Amer_Charadriiformes', name='CY102633_W_N.Amer_Charadriiformes', description='CY102633_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AY738451_D_Middle.East_Galliformes', name='AY738451_D_Middle.East_Galliformes', description='AY738451_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461515_D_E.Asia.E.China_Galliformes', name='AF461515_D_E.Asia.E.China_Galliformes', description='AF461515_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461518_D_E.Asia.E.China_Galliformes', name='AF461518_D_E.Asia.E.China_Galliformes', description='AF461518_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAEELLHTE...---', SingleLetterAlphabet()), id='AF461519_D_E.Asia.E.China_Galliformes', name='AF461519_D_E.Asia.E.China_Galliformes', description='AF461519_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLAVTISNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461523_D_E.Asia.E.China_Galliformes', name='AF461523_D_E.Asia.E.China_Galliformes', description='AF461523_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITIILVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461529_D_China.West_Galliformes', name='AF461529_D_China.West_Galliformes', description='AF461529_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461531_D_E.Asia.E.China_Galliformes', name='AF461531_D_E.Asia.E.China_Galliformes', description='AF461531_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTASNADKICISYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AY513715_D_E.Asia.E.China_Galliformes', name='AY513715_D_E.Asia.E.China_Galliformes', description='AY513715_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023976_D_China.Central_Galliformes', name='CY023976_D_China.Central_Galliformes', description='CY023976_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTIGNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY024568_D_China.Central_Galliformes', name='CY024568_D_China.Central_Galliformes', description='CY024568_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY024576_D_China.Central_Galliformes', name='CY024576_D_China.Central_Galliformes', description='CY024576_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASTADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064355_D_E.Asia.E.China_Galliformes', name='DQ064355_D_E.Asia.E.China_Galliformes', description='DQ064355_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064368_D_China.Central_Galliformes', name='DQ064368_D_China.Central_Galliformes', description='DQ064368_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVLLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064372_D_E.Asia.E.China_Galliformes', name='DQ064372_D_E.Asia.E.China_Galliformes', description='DQ064372_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063510_D_Middle.East_Galliformes', name='EF063510_D_Middle.East_Galliformes', description='EF063510_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063511_D_Middle.East_Galliformes', name='EF063511_D_Middle.East_Galliformes', description='EF063511_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063512_D_Middle.East_Galliformes', name='EF063512_D_Middle.East_Galliformes', description='EF063512_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492221_D_Middle.East_Galliformes', name='EF492221_D_Middle.East_Galliformes', description='EF492221_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVVTETSNADKICIGYQSTNSTETVDTLVENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='EF620900_D_E.Asia.E.China_Galliformes', name='EF620900_D_E.Asia.E.China_Galliformes', description='EF620900_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU477248_D_Middle.East_Galliformes', name='EU477248_D_Middle.East_Galliformes', description='EU477248_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTAGNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU477249_D_Middle.East_Galliformes', name='EU477249_D_Middle.East_Galliformes', description='EU477249_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497122_D_Middle.East_Galliformes', name='GQ497122_D_Middle.East_Galliformes', description='GQ497122_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497123_D_Middle.East_Galliformes', name='GQ497123_D_Middle.East_Galliformes', description='GQ497123_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY006023_D_E.Asia.E.China_Galliformes', name='CY006023_D_E.Asia.E.China_Galliformes', description='CY006023_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLYTE...---', SingleLetterAlphabet()), id='AB256674_D_E.Asia.E.China_Galliformes', name='AB256674_D_E.Asia.E.China_Galliformes', description='AB256674_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLIPILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB256690_D_E.Asia.E.China_Galliformes', name='AB256690_D_E.Asia.E.China_Galliformes', description='AB256690_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB256738_D_E.Asia.E.China_Galliformes', name='AB256738_D_E.Asia.E.China_Galliformes', description='AB256738_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB256746_D_E.Asia.E.China_Galliformes', name='AB256746_D_E.Asia.E.China_Galliformes', description='AB256746_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLAVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461524_D_E.Asia.E.China_Galliformes', name='AF461524_D_E.Asia.E.China_Galliformes', description='AF461524_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METLSLTTILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023104_D_China.Central_Galliformes', name='CY023104_D_China.Central_Galliformes', description='CY023104_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METLSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023920_D_China.Central_Anseriformes', name='CY023920_D_China.Central_Anseriformes', description='CY023920_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY024696_D_China.Central_Galliformes', name='CY024696_D_China.Central_Galliformes', description='CY024696_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METLSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY024704_D_China.Central_Galliformes', name='CY024704_D_China.Central_Galliformes', description='CY024704_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METLSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY024712_D_China.Central_Galliformes', name='CY024712_D_China.Central_Galliformes', description='CY024712_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATAIITILLVITASYADKICIGYQSTNSTETVDTLTETNVPVTHTKDLLHTE...---', SingleLetterAlphabet()), id='CY073800_D_SE.Asia_Anseriformes', name='CY073800_D_SE.Asia_Anseriformes', description='CY073800_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ064367_D_E.Asia.E.China_Galliformes', name='DQ064367_D_E.Asia.E.China_Galliformes', description='DQ064367_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ681216_D_E.Asia.E.China_Anseriformes', name='DQ681216_D_E.Asia.E.China_Anseriformes', description='DQ681216_D_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063513_D_Middle.East_Galliformes', name='EF063513_D_Middle.East_Galliformes', description='EF063513_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063514_D_Middle.East_Galliformes', name='EF063514_D_Middle.East_Galliformes', description='EF063514_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF154917_D_China.Central_Galliformes', name='EF154917_D_China.Central_Galliformes', description='EF154917_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVIASNADKICIGHQSTNSTETVDTLTETNVPVTHAQELLHTE...---', SingleLetterAlphabet()), id='EF154922_D_China.Central_Galliformes', name='EF154922_D_China.Central_Galliformes', description='EF154922_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF154923_D_China.Central_Galliformes', name='EF154923_D_China.Central_Galliformes', description='EF154923_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF154924_D_China.Central_Galliformes', name='EF154924_D_China.Central_Galliformes', description='EF154924_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTPLMTILLMVTAINADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF154925_D_China.Central_Galliformes', name='EF154925_D_China.Central_Galliformes', description='EF154925_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492233_D_Middle.East_Galliformes', name='EF492233_D_Middle.East_Galliformes', description='EF492233_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='EF541419_D_SE.Asia_Anseriformes', name='EF541419_D_SE.Asia_Anseriformes', description='EF541419_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIAIIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='EF541420_D_SE.Asia_Anseriformes', name='EF541420_D_SE.Asia_Anseriformes', description='EF541420_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVVTGTSDADKICIGYQSTNSTETVDTLVENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='EU253561_D_E.Asia.E.China_Galliformes', name='EU253561_D_E.Asia.E.China_Galliformes', description='EU253561_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATSLITILLLVTTSNADKICIGYQSTNPTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190132_D_E.Asia.E.China_Galliformes', name='FJ190132_D_E.Asia.E.China_Galliformes', description='FJ190132_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLRAIAGNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273541_D_Europe_Galliformes', name='JX273541_D_Europe_Galliformes', description='JX273541_D_Europe_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188352_D_Middle.East_Galliformes', name='KF188352_D_Middle.East_Galliformes', description='KF188352_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188377_D_E.Asia.E.China_Anseriformes', name='KF188377_D_E.Asia.E.China_Anseriformes', description='KF188377_D_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497124_D_Middle.East_Galliformes', name='GQ497124_D_Middle.East_Galliformes', description='GQ497124_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELIHTE...---', SingleLetterAlphabet()), id='AY738454_D_Middle.East_Galliformes', name='AY738454_D_Middle.East_Galliformes', description='AY738454_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471884_D_China.Central_Galliformes', name='GU471884_D_China.Central_Galliformes', description='GU471884_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLVVTTSNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144389_W_N.Amer_Charadriiformes', name='CY144389_W_N.Amer_Charadriiformes', description='CY144389_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLVVTTSNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144397_W_N.Amer_Charadriiformes', name='CY144397_W_N.Amer_Charadriiformes', description='CY144397_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTISNADKICIGYQSTNSTETVDTLTENNVPVTHARELLHTE...---', SingleLetterAlphabet()), id='AB256714_D_E.Asia.E.China_Galliformes', name='AB256714_D_E.Asia.E.China_Galliformes', description='AB256714_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AY949989_D_E.Asia.E.China_Galliformes', name='AY949989_D_E.Asia.E.China_Galliformes', description='AY949989_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEALSPITILLVVAVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHAE...---', SingleLetterAlphabet()), id='CY023848_D_China.West_Galliformes', name='CY023848_D_China.West_Galliformes', description='CY023848_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKFCIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY076723_D_Middle.East_Galliformes', name='CY076723_D_Middle.East_Galliformes', description='CY076723_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ997451_D_E.Asia.E.China_Anseriformes', name='DQ997451_D_E.Asia.E.China_Anseriformes', description='DQ997451_D_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063515_D_Middle.East_Galliformes', name='EF063515_D_Middle.East_Galliformes', description='EF063515_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492229_D_Middle.East_Galliformes', name='EF492229_D_Middle.East_Galliformes', description='EF492229_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU477246_D_Middle.East_Galliformes', name='EU477246_D_Middle.East_Galliformes', description='EU477246_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ384751_D_E.Asia.E.China_Galliformes', name='FJ384751_D_E.Asia.E.China_Galliformes', description='FJ384751_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU050554_D_Middle.East_Galliformes', name='GU050554_D_Middle.East_Galliformes', description='GU050554_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLMTTTSNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273565_W_Europe_Charadriiformes', name='JX273565_W_Europe_Charadriiformes', description='JX273565_W_Europe_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQVSLMTVLLVATASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497125_D_Middle.East_Galliformes', name='GQ497125_D_Middle.East_Galliformes', description='GQ497125_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVATASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497126_D_Middle.East_Galliformes', name='GQ497126_D_Middle.East_Galliformes', description='GQ497126_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGYQSTNSTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF916721_D_E.Asia.E.China_Anseriformes', name='JF916721_D_E.Asia.E.China_Anseriformes', description='JF916721_D_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY068643_D_S.Asia_Galliformes', name='CY068643_D_S.Asia_Galliformes', description='CY068643_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497128_D_Middle.East_Galliformes', name='GQ497128_D_Middle.East_Galliformes', description='GQ497128_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIVHQSTNSTETVNTLTETNVPVTYAKELLHTE...---', SingleLetterAlphabet()), id='EU665420_D_S.Asia_Galliformes', name='EU665420_D_S.Asia_Galliformes', description='EU665420_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIGHQSTNSTETVNTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU665421_D_S.Asia_Galliformes', name='EU665421_D_S.Asia_Galliformes', description='EU665421_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILL--TASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY004420_W_N.Amer_Charadriiformes', name='CY004420_W_N.Amer_Charadriiformes', description='CY004420_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILL--TASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY102720_W_N.Amer_Charadriiformes', name='CY102720_W_N.Amer_Charadriiformes', description='CY102720_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY005992_W_N.Amer_Charadriiformes', name='CY005992_W_N.Amer_Charadriiformes', description='CY005992_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSATASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144515_W_N.Amer_Charadriiformes', name='CY144515_W_N.Amer_Charadriiformes', description='CY144515_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSATASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144373_W_N.Amer_Charadriiformes', name='CY144373_W_N.Amer_Charadriiformes', description='CY144373_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSATASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144473_W_N.Amer_Charadriiformes', name='CY144473_W_N.Amer_Charadriiformes', description='CY144473_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSATASNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144523_W_N.Amer_Charadriiformes', name='CY144523_W_N.Amer_Charadriiformes', description='CY144523_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144539_W_N.Amer_Charadriiformes', name='CY144539_W_N.Amer_Charadriiformes', description='CY144539_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144547_W_N.Amer_Charadriiformes', name='CY144547_W_N.Amer_Charadriiformes', description='CY144547_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144563_W_N.Amer_Charadriiformes', name='CY144563_W_N.Amer_Charadriiformes', description='CY144563_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVENNVPVTHAKELLQTE...---', SingleLetterAlphabet()), id='AY790313_D_E.Asia.E.China_Galliformes', name='AY790313_D_E.Asia.E.China_Galliformes', description='AY790313_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEILALIAILVVTGTGNADKICIGYQSTNSTETVDTLVENNVPVTHTKELLHTG...---', SingleLetterAlphabet()), id='AY862599_D_E.Asia.E.China_Galliformes', name='AY862599_D_E.Asia.E.China_Galliformes', description='AY862599_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVVTGTGNADKICIGYQSTNSTETVDTLVENNVPVTHTKELLHTG...---', SingleLetterAlphabet()), id='AY862606_D_E.Asia.E.China_Galliformes', name='AY862606_D_E.Asia.E.China_Galliformes', description='AY862606_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKALSPITILLVVAVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHAE...---', SingleLetterAlphabet()), id='CY023872_D_China.West_Galliformes', name='CY023872_D_China.West_Galliformes', description='CY023872_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKALSPITILLVVAVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHAE...---', SingleLetterAlphabet()), id='CY023880_D_China.West_Galliformes', name='CY023880_D_China.West_Galliformes', description='CY023880_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ681203_D_E.Asia.E.China_Anseriformes', name='DQ681203_D_E.Asia.E.China_Anseriformes', description='DQ681203_D_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063516_D_Middle.East_Galliformes', name='EF063516_D_Middle.East_Galliformes', description='EF063516_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVATASNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063725_D_Middle.East_Galliformes', name='EF063725_D_Middle.East_Galliformes', description='EF063725_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063726_D_Middle.East_Galliformes', name='EF063726_D_Middle.East_Galliformes', description='EF063726_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVATASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FN600115_W_Middle.East_Anseriformes', name='FN600115_W_Middle.East_Anseriformes', description='FN600115_W_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVGTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM008896_D_E.Asia.E.China_Galliformes', name='HM008896_D_E.Asia.E.China_Galliformes', description='HM008896_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM008897_D_E.Asia.E.China_Galliformes', name='HM008897_D_E.Asia.E.China_Galliformes', description='HM008897_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLLVTTSNADKICIGYQSTNSTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM008898_D_E.Asia.E.China_Galliformes', name='HM008898_D_E.Asia.E.China_Galliformes', description='HM008898_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273542_D_S.Asia_Galliformes', name='JX273542_D_S.Asia_Galliformes', description='JX273542_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273552_D_S.Asia_Galliformes', name='JX273552_D_S.Asia_Galliformes', description='JX273552_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273553_D_S.Asia_Galliformes', name='JX273553_D_S.Asia_Galliformes', description='JX273553_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF188256_W_N.Amer_Charadriiformes', name='KF188256_W_N.Amer_Charadriiformes', description='KF188256_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF188278_W_N.Amer_Charadriiformes', name='KF188278_W_N.Amer_Charadriiformes', description='KF188278_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188304_D_China.Central_Galliformes', name='KF188304_D_China.Central_Galliformes', description='KF188304_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVATASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497127_D_Middle.East_Galliformes', name='GQ497127_D_Middle.East_Galliformes', description='GQ497127_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKVVSLITILLAVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB634251_D_E.Asia.E.China_Galliformes', name='AB634251_D_E.Asia.E.China_Galliformes', description='AB634251_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF746785_D_E.Asia.E.China_Galliformes', name='KF746785_D_E.Asia.E.China_Galliformes', description='KF746785_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMTILLMVTVINADKICIGYQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='CY024320_D_China.Central_Galliformes', name='CY024320_D_China.Central_Galliformes', description='CY024320_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ464352_D_E.Asia.E.China_Galliformes', name='DQ464352_D_E.Asia.E.China_Galliformes', description='DQ464352_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ465400_D_China.Central_Anseriformes', name='DQ465400_D_China.Central_Anseriformes', description='DQ465400_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILGVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='DQ885991_D_E.Asia.E.China_Galliformes', name='DQ885991_D_E.Asia.E.China_Galliformes', description='DQ885991_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHARELLHTE...---', SingleLetterAlphabet()), id='EF063729_D_Middle.East_Galliformes', name='EF063729_D_Middle.East_Galliformes', description='EF063729_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVATASNADKICIGHQSTNSTETVDTLTETNVPVTDAKELLHTE...---', SingleLetterAlphabet()), id='EF063730_D_Middle.East_Galliformes', name='EF063730_D_Middle.East_Galliformes', description='EF063730_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063731_D_Middle.East_Galliformes', name='EF063731_D_Middle.East_Galliformes', description='EF063731_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492242_D_Middle.East_Galliformes', name='EF492242_D_Middle.East_Galliformes', description='EF492242_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU662946_D_E.Asia.E.China_Galliformes', name='EU662946_D_E.Asia.E.China_Galliformes', description='EU662946_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU662947_D_E.Asia.E.China_Galliformes', name='EU662947_D_E.Asia.E.China_Galliformes', description='EU662947_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273537_D_Middle.East_Anseriformes', name='JX273537_D_Middle.East_Anseriformes', description='JX273537_D_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273545_D_Middle.East_Galliformes', name='JX273545_D_Middle.East_Galliformes', description='JX273545_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273546_D_Middle.East_Galliformes', name='JX273546_D_Middle.East_Galliformes', description='JX273546_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188395_D_E.Asia.E.China_Galliformes', name='KF188395_D_E.Asia.E.China_Galliformes', description='KF188395_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188399_D_S.Asia_Galliformes', name='KF188399_D_S.Asia_Galliformes', description='KF188399_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF746835_D_E.Asia.E.China_Galliformes', name='KF746835_D_E.Asia.E.China_Galliformes', description='KF746835_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='CY038410_D_S.Asia_Galliformes', name='CY038410_D_S.Asia_Galliformes', description='CY038410_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METLSIITILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023416_D_China.Central_Galliformes', name='CY023416_D_China.Central_Galliformes', description='CY023416_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLIVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023424_D_China.Central_Galliformes', name='CY023424_D_China.Central_Galliformes', description='CY023424_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023608_D_E.Asia.E.China_Galliformes', name='CY023608_D_E.Asia.E.China_Galliformes', description='CY023608_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY023680_D_E.Asia.E.China_Galliformes', name='CY023680_D_E.Asia.E.China_Galliformes', description='CY023680_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMTILLMVTAINADKICIGYQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='CY024504_D_China.Central_Galliformes', name='CY024504_D_China.Central_Galliformes', description='CY024504_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY043856_W_Europe_Anseriformes', name='CY043856_W_Europe_Anseriformes', description='CY043856_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063733_D_Middle.East_Galliformes', name='EF063733_D_Middle.East_Galliformes', description='EF063733_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF063734_D_Middle.East_Galliformes', name='EF063734_D_Middle.East_Galliformes', description='EF063734_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF154968_D_China.Central_Galliformes', name='EF154968_D_China.Central_Galliformes', description='EF154968_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMTILLMVTAINADKICIGYQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='EF154976_D_China.Central_Galliformes', name='EF154976_D_China.Central_Galliformes', description='EF154976_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492222_D_Middle.East_Galliformes', name='EF492222_D_Middle.East_Galliformes', description='EF492222_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492225_D_Middle.East_Galliformes', name='EF492225_D_Middle.East_Galliformes', description='EF492225_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHAE...---', SingleLetterAlphabet()), id='EF492230_D_Middle.East_Galliformes', name='EF492230_D_Middle.East_Galliformes', description='EF492230_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTAINADKICIGYQSTNSTEAVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492234_D_Middle.East_Galliformes', name='EF492234_D_Middle.East_Galliformes', description='EF492234_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTAINADKICIGYQSTNSTEAVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492236_D_Middle.East_Galliformes', name='EF492236_D_Middle.East_Galliformes', description='EF492236_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273556_D_Middle.East_Galliformes', name='JX273556_D_Middle.East_Galliformes', description='JX273556_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188254_D_Middle.East_Galliformes', name='KF188254_D_Middle.East_Galliformes', description='KF188254_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVATSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188325_D_S.Asia_Galliformes', name='KF188325_D_S.Asia_Galliformes', description='KF188325_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGTTSLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188337_W_Middle.East_Charadriiformes', name='KF188337_W_Middle.East_Charadriiformes', description='KF188337_W_Middle.East_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188347_D_S.Asia_Galliformes', name='KF188347_D_S.Asia_Galliformes', description='KF188347_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVATSNADKICVGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188359_D_S.Asia_Galliformes', name='KF188359_D_S.Asia_Galliformes', description='KF188359_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188371_W_Middle.East_Charadriiformes', name='KF188371_W_Middle.East_Charadriiformes', description='KF188371_W_Middle.East_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLAVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259064_D_China.Central_Galliformes', name='KF259064_D_China.Central_Galliformes', description='KF259064_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLSTTAINADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY075925_W_N.Amer_Charadriiformes', name='CY075925_W_N.Amer_Charadriiformes', description='CY075925_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KC209500_W_E.Asia.E.China_Anseriformes', name='KC209500_W_E.Asia.E.China_Anseriformes', description='KC209500_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQLSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497131_D_Middle.East_Galliformes', name='GQ497131_D_Middle.East_Galliformes', description='GQ497131_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038442_D_S.Asia_Galliformes', name='CY038442_D_S.Asia_Galliformes', description='CY038442_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038418_D_S.Asia_Galliformes', name='CY038418_D_S.Asia_Galliformes', description='CY038418_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU722360_D_China.Central_Galliformes', name='GU722360_D_China.Central_Galliformes', description='GU722360_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILVMTGTGNADKICIGYQSTNSTETVDTLVENNVPVTHTKELLRTE...---', SingleLetterAlphabet()), id='GU247915_D_E.Asia.E.China_Galliformes', name='GU247915_D_E.Asia.E.China_Galliformes', description='GU247915_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN540058_D_S.Asia_Galliformes', name='JN540058_D_S.Asia_Galliformes', description='JN540058_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU722362_D_China.Central_Galliformes', name='GU722362_D_China.Central_Galliformes', description='GU722362_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038426_D_S.Asia_Galliformes', name='CY038426_D_S.Asia_Galliformes', description='CY038426_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY041426_W_N.Amer_Charadriiformes', name='CY041426_W_N.Amer_Charadriiformes', description='CY041426_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY043912_W_N.Amer_Charadriiformes', name='CY043912_W_N.Amer_Charadriiformes', description='CY043912_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY041434_W_N.Amer_Charadriiformes', name='CY041434_W_N.Amer_Charadriiformes', description='CY041434_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144699_W_N.Amer_Charadriiformes', name='CY144699_W_N.Amer_Charadriiformes', description='CY144699_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497134_D_Middle.East_Galliformes', name='GQ497134_D_Middle.East_Galliformes', description='GQ497134_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471895_D_China.Central_Galliformes', name='GU471895_D_China.Central_Galliformes', description='GU471895_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY041266_W_Europe_Anseriformes', name='CY041266_W_Europe_Anseriformes', description='CY041266_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY043864_W_Europe_Anseriformes', name='CY043864_W_Europe_Anseriformes', description='CY043864_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLISTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EF492224_D_Middle.East_Galliformes', name='EF492224_D_Middle.East_Galliformes', description='EF492224_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKALSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU086283_D_E.Asia.E.China_Galliformes', name='EU086283_D_E.Asia.E.China_Galliformes', description='EU086283_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METI----SLIVITVSNADKICIGYLSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU157934_D_China.West_Galliformes', name='EU157934_D_China.West_Galliformes', description='EU157934_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLLTILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216085_D_China.West_Galliformes', name='EU216085_D_China.West_Galliformes', description='EU216085_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216088_D_China.West_Galliformes', name='EU216088_D_China.West_Galliformes', description='EU216088_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU573941_D_E.Asia.E.China_Galliformes', name='EU573941_D_E.Asia.E.China_Galliformes', description='EU573941_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTILLVVTTSNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTV...---', SingleLetterAlphabet()), id='FJ464730_D_Middle.East_Galliformes', name='FJ464730_D_Middle.East_Galliformes', description='FJ464730_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ373075_D_E.Asia.E.China_Galliformes', name='GQ373075_D_E.Asia.E.China_Galliformes', description='GQ373075_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273538_D_Middle.East_Anseriformes', name='JX273538_D_Middle.East_Anseriformes', description='JX273538_D_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273555_D_Middle.East_Galliformes', name='JX273555_D_Middle.East_Galliformes', description='JX273555_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273559_D_Middle.East_Galliformes', name='JX273559_D_Middle.East_Galliformes', description='JX273559_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273560_D_Middle.East_Galliformes', name='JX273560_D_Middle.East_Galliformes', description='JX273560_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273566_W_Europe_Anseriformes', name='JX273566_W_Europe_Anseriformes', description='JX273566_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTVSYADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188375_D_Middle.East_Galliformes', name='KF188375_D_Middle.East_Galliformes', description='KF188375_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIVSLITILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259069_D_China.Central_Galliformes', name='KF259069_D_China.Central_Galliformes', description='KF259069_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259071_D_China.Central_Galliformes', name='KF259071_D_China.Central_Galliformes', description='KF259071_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259073_D_China.Central_Galliformes', name='KF259073_D_China.Central_Galliformes', description='KF259073_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSPITILLVITVSNADKICIGYQSTNSTETVDTLIENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259075_D_China.Central_Galliformes', name='KF259075_D_China.Central_Galliformes', description='KF259075_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038402_D_S.Asia_Galliformes', name='CY038402_D_S.Asia_Galliformes', description='CY038402_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAQELLHTE...---', SingleLetterAlphabet()), id='FJ190135_D_E.Asia.E.China_Galliformes', name='FJ190135_D_E.Asia.E.China_Galliformes', description='FJ190135_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKALSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU722363_D_China.Central_Galliformes', name='GU722363_D_China.Central_Galliformes', description='GU722363_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEQLSLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497133_D_Middle.East_Galliformes', name='GQ497133_D_Middle.East_Galliformes', description='GQ497133_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ464728_D_Middle.East_Galliformes', name='FJ464728_D_Middle.East_Galliformes', description='FJ464728_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ464729_D_Middle.East_Galliformes', name='FJ464729_D_Middle.East_Galliformes', description='FJ464729_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ464714_D_Middle.East_Galliformes', name='FJ464714_D_Middle.East_Galliformes', description='FJ464714_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038434_D_S.Asia_Galliformes', name='CY038434_D_S.Asia_Galliformes', description='CY038434_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTANNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY144763_W_N.Amer_Charadriiformes', name='CY144763_W_N.Amer_Charadriiformes', description='CY144763_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038482_D_S.Asia_Galliformes', name='CY038482_D_S.Asia_Galliformes', description='CY038482_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTIALIAILLSTTANNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY077174_W_N.Amer_Charadriiformes', name='CY077174_W_N.Amer_Charadriiformes', description='CY077174_W_N.Amer_Charadriiformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSIADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038394_D_S.Asia_Galliformes', name='CY038394_D_S.Asia_Galliformes', description='CY038394_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLATTTSNADKICIGYQSTNSTETVDTLMESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AB874675_W_E.Asia.E.China_Anseriformes', name='AB874675_W_E.Asia.E.China_Anseriformes', description='AB874675_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY041274_W_Europe_Anseriformes', name='CY041274_W_Europe_Anseriformes', description='CY041274_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVITVSNADKICIGYQSTNSTETVNTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216080_D_China.West_Galliformes', name='EU216080_D_China.West_Galliformes', description='EU216080_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216081_D_China.West_Galliformes', name='EU216081_D_China.West_Galliformes', description='EU216081_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216082_D_China.West_Galliformes', name='EU216082_D_China.West_Galliformes', description='EU216082_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METI----SLIVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216083_D_China.West_Galliformes', name='EU216083_D_China.West_Galliformes', description='EU216083_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVKTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216084_D_China.West_Galliformes', name='EU216084_D_China.West_Galliformes', description='EU216084_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('----METISLLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216086_D_China.West_Galliformes', name='EU216086_D_China.West_Galliformes', description='EU216086_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLLNMQLVVTVSNADEICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216087_D_China.West_Galliformes', name='EU216087_D_China.West_Galliformes', description='EU216087_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216089_D_China.West_Galliformes', name='EU216089_D_China.West_Galliformes', description='EU216089_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216090_D_China.West_Galliformes', name='EU216090_D_China.West_Galliformes', description='EU216090_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLLTMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216091_D_China.West_Galliformes', name='EU216091_D_China.West_Galliformes', description='EU216091_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLLTMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU216092_D_China.West_Galliformes', name='EU216092_D_China.West_Galliformes', description='EU216092_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLIVTTSNADKICIGHQSTNSTETVDTLAETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU477243_D_Middle.East_Galliformes', name='EU477243_D_Middle.East_Galliformes', description='EU477243_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU477539_D_Middle.East_Galliformes', name='EU477539_D_Middle.East_Galliformes', description='EU477539_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU644482_D_China.West_Anseriformes', name='EU644482_D_China.West_Anseriformes', description='EU644482_D_China.West_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU644485_D_China.West_Galliformes', name='EU644485_D_China.West_Galliformes', description='EU644485_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='FN600116_W_Middle.East_Anseriformes', name='FN600116_W_Middle.East_Anseriformes', description='FN600116_W_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='FN600117_W_Middle.East_Anseriformes', name='FN600117_W_Middle.East_Anseriformes', description='FN600117_W_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTMSNAGKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM008887_D_E.Asia.E.China_Galliformes', name='HM008887_D_E.Asia.E.China_Galliformes', description='HM008887_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273539_D_S.Asia_Galliformes', name='JX273539_D_S.Asia_Galliformes', description='JX273539_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTG...---', SingleLetterAlphabet()), id='JX273540_D_S.Asia_Galliformes', name='JX273540_D_S.Asia_Galliformes', description='JX273540_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTATSSADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273568_W_Europe_Anseriformes', name='JX273568_W_Europe_Anseriformes', description='JX273568_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVINADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259078_D_China.Central_Galliformes', name='KF259078_D_China.Central_Galliformes', description='KF259078_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259079_D_China.Central_Galliformes', name='KF259079_D_China.Central_Galliformes', description='KF259079_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLIAMLLVVTVSNADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259083_D_China.Central_Galliformes', name='KF259083_D_China.Central_Galliformes', description='KF259083_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259084_D_China.Central_Galliformes', name='KF259084_D_China.Central_Galliformes', description='KF259084_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259089_D_China.Central_Galliformes', name='KF259089_D_China.Central_Galliformes', description='KF259089_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPATHAKELLHTE...---', SingleLetterAlphabet()), id='GU471799_D_China.West_Galliformes', name='GU471799_D_China.West_Galliformes', description='GU471799_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLVVTASNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497135_D_Middle.East_Galliformes', name='GQ497135_D_Middle.East_Galliformes', description='GQ497135_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JF745931_W_Europe_Anseriformes', name='JF745931_W_Europe_Anseriformes', description='JF745931_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVATTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194479_W_Europe_Anseriformes', name='GU194479_W_Europe_Anseriformes', description='GU194479_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194485_W_Europe_Anseriformes', name='GU194485_W_Europe_Anseriformes', description='GU194485_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190151_D_E.Asia.E.China_Galliformes', name='FJ190151_D_E.Asia.E.China_Galliformes', description='FJ190151_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190144_D_E.Asia.E.China_Galliformes', name='FJ190144_D_E.Asia.E.China_Galliformes', description='FJ190144_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MAIIVLIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194480_W_Europe_Anseriformes', name='GU194480_W_Europe_Anseriformes', description='GU194480_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194481_W_Europe_Anseriformes', name='GU194481_W_Europe_Anseriformes', description='GU194481_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTGNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ497136_D_Middle.East_Galliformes', name='GQ497136_D_Middle.East_Galliformes', description='GQ497136_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190137_D_E.Asia.E.China_Galliformes', name='FJ190137_D_E.Asia.E.China_Galliformes', description='FJ190137_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ464726_D_Middle.East_Galliformes', name='FJ464726_D_Middle.East_Galliformes', description='FJ464726_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAQELLHTE...---', SingleLetterAlphabet()), id='FJ190136_D_E.Asia.E.China_Galliformes', name='FJ190136_D_E.Asia.E.China_Galliformes', description='FJ190136_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ120560_D_Middle.East_Galliformes', name='GQ120560_D_Middle.East_Galliformes', description='GQ120560_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ120559_D_Middle.East_Galliformes', name='GQ120559_D_Middle.East_Galliformes', description='GQ120559_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAQELLHTE...---', SingleLetterAlphabet()), id='FJ190149_D_China.West_Galliformes', name='FJ190149_D_China.West_Galliformes', description='FJ190149_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471894_D_China.Central_Galliformes', name='GU471894_D_China.Central_Galliformes', description='GU471894_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEKTTLIAILLMVTASNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KC693645_W_E.Asia.E.China_Anseriformes', name='KC693645_W_E.Asia.E.China_Anseriformes', description='KC693645_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEKIPLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY038450_D_S.Asia_Galliformes', name='CY038450_D_S.Asia_Galliformes', description='CY038450_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ464727_D_Middle.East_Galliformes', name='FJ464727_D_Middle.East_Galliformes', description='FJ464727_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ120561_D_Middle.East_Galliformes', name='GQ120561_D_Middle.East_Galliformes', description='GQ120561_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIVLIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLYTE...---', SingleLetterAlphabet()), id='GU194486_W_Europe_Anseriformes', name='GU194486_W_Europe_Anseriformes', description='GU194486_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ534538_D_China.Central_Galliformes', name='FJ534538_D_China.Central_Galliformes', description='FJ534538_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194487_W_Europe_Anseriformes', name='GU194487_W_Europe_Anseriformes', description='GU194487_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX456177_D_Middle.East_Galliformes', name='JX456177_D_Middle.East_Galliformes', description='JX456177_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTDTVDTLTETNIPVTQAKELLHTE...---', SingleLetterAlphabet()), id='CY038466_D_S.Asia_Galliformes', name='CY038466_D_S.Asia_Galliformes', description='CY038466_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGKIPLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN540066_D_S.Asia_Galliformes', name='JN540066_D_S.Asia_Galliformes', description='JN540066_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTDTVDTLTETNIPVTQAKELLHTE...---', SingleLetterAlphabet()), id='CY038474_D_S.Asia_Galliformes', name='CY038474_D_S.Asia_Galliformes', description='CY038474_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190138_D_E.Asia.E.China_Galliformes', name='FJ190138_D_E.Asia.E.China_Galliformes', description='FJ190138_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU064951_D_S.Asia_Galliformes', name='GU064951_D_S.Asia_Galliformes', description='GU064951_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273543_D_Middle.East_Galliformes', name='JX273543_D_Middle.East_Galliformes', description='JX273543_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITVSNADKICIGYQSTNSTETVNTLTEDNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188397_D_China.Central_Galliformes', name='KF188397_D_China.Central_Galliformes', description='KF188397_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVPLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259097_D_China.Central_Galliformes', name='KF259097_D_China.Central_Galliformes', description='KF259097_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLIVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259098_D_China.Central_Galliformes', name='KF259098_D_China.Central_Galliformes', description='KF259098_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GQ120552_D_Middle.East_Galliformes', name='GQ120552_D_Middle.East_Galliformes', description='GQ120552_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVTTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTG...---', SingleLetterAlphabet()), id='KF746867_D_China.Central_Galliformes', name='KF746867_D_China.Central_Galliformes', description='KF746867_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471880_D_China.Central_Galliformes', name='GU471880_D_China.Central_Galliformes', description='GU471880_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVATVINADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471881_D_China.Central_Galliformes', name='GU471881_D_China.Central_Galliformes', description='GU471881_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='GU194482_W_Europe_Anseriformes', name='GU194482_W_Europe_Anseriformes', description='GU194482_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMITASNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY079646_W_N.Amer_Anseriformes', name='CY079646_W_N.Amer_Anseriformes', description='CY079646_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLVTILLVVTTSNADKICIGHQSTNSTETVDTLTEANVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU071967_D_Middle.East_Galliformes', name='GU071967_D_Middle.East_Galliformes', description='GU071967_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLVTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU071968_D_Middle.East_Galliformes', name='GU071968_D_Middle.East_Galliformes', description='GU071968_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLMVTTSDADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157025_W_N.Amer_Anseriformes', name='CY157025_W_N.Amer_Anseriformes', description='CY157025_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX456179_D_Middle.East_Galliformes', name='JX456179_D_Middle.East_Galliformes', description='JX456179_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC757788_D_S.Asia_Anseriformes', name='KC757788_D_S.Asia_Anseriformes', description='KC757788_D_S.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC757967_D_S.Asia_Galliformes', name='KC757967_D_S.Asia_Galliformes', description='KC757967_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU086234_D_E.Asia.E.China_Galliformes', name='GU086234_D_E.Asia.E.China_Galliformes', description='GU086234_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKSIVLIAILLVATTSNADKICIGYQSTNSTETVDTLIESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AB545591_D_SE.Asia_Anseriformes', name='AB545591_D_SE.Asia_Anseriformes', description='AB545591_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='HE802723_W_Europe_Anseriformes', name='HE802723_W_Europe_Anseriformes', description='HE802723_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTGNADKICVGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273549_D_S.Asia_Galliformes', name='JX273549_D_S.Asia_Galliformes', description='JX273549_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF188249_D_S.Asia_Galliformes', name='KF188249_D_S.Asia_Galliformes', description='KF188249_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVLLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259108_D_China.Central_Galliformes', name='KF259108_D_China.Central_Galliformes', description='KF259108_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY116614_W_Europe_Anseriformes', name='CY116614_W_Europe_Anseriformes', description='CY116614_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY116616_W_Europe_Anseriformes', name='CY116616_W_Europe_Anseriformes', description='CY116616_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY116618_W_Europe_Anseriformes', name='CY116618_W_Europe_Anseriformes', description='CY116618_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY116620_W_Europe_Anseriformes', name='CY116620_W_Europe_Anseriformes', description='CY116620_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF746819_D_E.Asia.E.China_Galliformes', name='KF746819_D_E.Asia.E.China_Galliformes', description='KF746819_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLGVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471868_D_E.Asia.E.China_Galliformes', name='GU471868_D_E.Asia.E.China_Galliformes', description='GU471868_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVATVINADEICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471870_D_E.Asia.E.China_Galliformes', name='GU471870_D_E.Asia.E.China_Galliformes', description='GU471870_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471803_D_China.West_Galliformes', name='GU471803_D_China.West_Galliformes', description='GU471803_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY087171_D_China.West_Galliformes', name='CY087171_D_China.West_Galliformes', description='CY087171_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY087179_D_China.West_Galliformes', name='CY087179_D_China.West_Galliformes', description='CY087179_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY087187_D_China.West_Anseriformes', name='CY087187_D_China.West_Anseriformes', description='CY087187_D_China.West_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471800_D_China.West_Galliformes', name='GU471800_D_China.West_Galliformes', description='GU471800_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNAGKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU471804_D_China.West_Galliformes', name='GU471804_D_China.West_Galliformes', description='GU471804_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF746843_D_China.Central_Galliformes', name='KF746843_D_China.Central_Galliformes', description='KF746843_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLIATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF746769_D_E.Asia.E.China_Galliformes', name='KF746769_D_E.Asia.E.China_Galliformes', description='KF746769_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLMATTSNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157502_W_N.Amer_Anseriformes', name='CY157502_W_N.Amer_Anseriformes', description='CY157502_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLMVTTSNADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157510_W_N.Amer_Anseriformes', name='CY157510_W_N.Amer_Anseriformes', description='CY157510_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNIPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JN540074_D_S.Asia_Galliformes', name='JN540074_D_S.Asia_Galliformes', description='JN540074_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTTLIAILLMATASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY097630_W_N.Amer_Anseriformes', name='CY097630_W_N.Amer_Anseriformes', description='CY097630_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY146513_W_N.Amer_Anseriformes', name='CY146513_W_N.Amer_Anseriformes', description='CY146513_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC757999_D_S.Asia_Galliformes', name='KC757999_D_S.Asia_Galliformes', description='KC757999_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC296446_D_China.Central_Galliformes', name='KC296446_D_China.Central_Galliformes', description='KC296446_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTDTVDTLTETNIPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JQ905259_D_S.Asia_Galliformes', name='JQ905259_D_S.Asia_Galliformes', description='JQ905259_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKSIALIAILLVTTSSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AB569975_D_SE.Asia_Anseriformes', name='AB569975_D_SE.Asia_Anseriformes', description='AB569975_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVITTSNADRICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273547_D_S.Asia_Galliformes', name='JX273547_D_S.Asia_Galliformes', description='JX273547_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVITTSNADRICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273548_D_S.Asia_Galliformes', name='JX273548_D_S.Asia_Galliformes', description='JX273548_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JX273557_D_Middle.East_Galliformes', name='JX273557_D_Middle.East_Galliformes', description='JX273557_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JX273558_D_Middle.East_Galliformes', name='JX273558_D_Middle.East_Galliformes', description='JX273558_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX448753_D_E.Asia.E.China_Galliformes', name='JX448753_D_E.Asia.E.China_Galliformes', description='JX448753_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVLLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259116_D_China.Central_Galliformes', name='KF259116_D_China.Central_Galliformes', description='KF259116_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITVSNADKICIGYQSTNSTETVNTLTEDNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259122_D_China.Central_Galliformes', name='KF259122_D_China.Central_Galliformes', description='KF259122_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY130453_W_N.Amer_Anseriformes', name='CY130453_W_N.Amer_Anseriformes', description='CY130453_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757832_D_S.Asia_Galliformes', name='KC757832_D_S.Asia_Galliformes', description='KC757832_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC758060_D_S.Asia_Galliformes', name='KC758060_D_S.Asia_Galliformes', description='KC758060_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY125750_W_N.Amer_Anseriformes', name='CY125750_W_N.Amer_Anseriformes', description='CY125750_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC758030_D_S.Asia_Galliformes', name='KC758030_D_S.Asia_Galliformes', description='KC758030_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY125733_W_N.Amer_Anseriformes', name='CY125733_W_N.Amer_Anseriformes', description='CY125733_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLTETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY125758_W_N.Amer_Anseriformes', name='CY125758_W_N.Amer_Anseriformes', description='CY125758_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSHADKICIGYQSTNSTETVDTLTENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF591855_D_SE.Asia_Anseriformes', name='KF591855_D_SE.Asia_Anseriformes', description='KF591855_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLMTILLLVTTSNADKICIGHQSTNSTETVDTLTENNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757951_D_S.Asia_Galliformes', name='KC757951_D_S.Asia_Galliformes', description='KC757951_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757991_D_S.Asia_Galliformes', name='KC757991_D_S.Asia_Galliformes', description='KC757991_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLITILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX310065_D_S.Asia_Galliformes', name='JX310065_D_S.Asia_Galliformes', description='JX310065_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MATISLITILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX310066_D_S.Asia_Galliformes', name='JX310066_D_S.Asia_Galliformes', description='JX310066_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLITILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX310067_D_S.Asia_Galliformes', name='JX310067_D_S.Asia_Galliformes', description='JX310067_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757855_D_S.Asia_Galliformes', name='KC757855_D_S.Asia_Galliformes', description='KC757855_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILMTILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY133373_W_N.Amer_Anseriformes', name='CY133373_W_N.Amer_Anseriformes', description='CY133373_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLIAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX456180_D_Middle.East_Galliformes', name='JX456180_D_Middle.East_Galliformes', description='JX456180_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY133633_W_N.Amer_Anseriformes', name='CY133633_W_N.Amer_Anseriformes', description='CY133633_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF800938_D_Middle.East_Galliformes', name='KF800938_D_Middle.East_Galliformes', description='KF800938_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX456182_D_Middle.East_Galliformes', name='JX456182_D_Middle.East_Galliformes', description='JX456182_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN653611_D_E.Asia.E.China_Galliformes', name='JN653611_D_E.Asia.E.China_Galliformes', description='JN653611_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757840_D_S.Asia_Galliformes', name='KC757840_D_S.Asia_Galliformes', description='KC757840_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KJ419947_D_E.Asia.E.China_Galliformes', name='KJ419947_D_E.Asia.E.China_Galliformes', description='KJ419947_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC758015_D_S.Asia_Galliformes', name='KC758015_D_S.Asia_Galliformes', description='KC758015_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN828570_D_Middle.East_Galliformes', name='JN828570_D_Middle.East_Galliformes', description='JN828570_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTTSNADRICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX273551_D_S.Asia_Galliformes', name='JX273551_D_S.Asia_Galliformes', description='JX273551_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JX273561_D_Middle.East_Galliformes', name='JX273561_D_Middle.East_Galliformes', description='JX273561_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGAISLMTILLVVTTSNADKICIGHQSTNSTETVNTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JX273562_D_Middle.East_Galliformes', name='JX273562_D_Middle.East_Galliformes', description='JX273562_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIVILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JX273570_D_Europe_Galliformes', name='JX273570_D_Europe_Galliformes', description='JX273570_D_Europe_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC757893_D_S.Asia_Galliformes', name='KC757893_D_S.Asia_Galliformes', description='KC757893_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVTLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC758106_D_S.Asia_Galliformes', name='KC758106_D_S.Asia_Galliformes', description='KC758106_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='KC555089_D_Middle.East_Anseriformes', name='KC555089_D_Middle.East_Anseriformes', description='KC555089_D_Middle.East_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC555097_D_Middle.East_Galliformes', name='KC555097_D_Middle.East_Galliformes', description='KC555097_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ440373_D_Middle.East_Galliformes', name='JQ440373_D_Middle.East_Galliformes', description='JQ440373_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLRAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KJ013297_W_E.Asia.E.China_Anseriformes', name='KJ013297_W_E.Asia.E.China_Anseriformes', description='KJ013297_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157518_W_N.Amer_Anseriformes', name='CY157518_W_N.Amer_Anseriformes', description='CY157518_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971949_W_China.Central_Anseriformes', name='KF971949_W_China.Central_Anseriformes', description='KF971949_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971957_W_China.Central_Anseriformes', name='KF971957_W_China.Central_Anseriformes', description='KF971957_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971965_W_China.Central_Anseriformes', name='KF971965_W_China.Central_Anseriformes', description='KF971965_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971973_W_China.Central_Anseriformes', name='KF971973_W_China.Central_Anseriformes', description='KF971973_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971981_W_China.Central_Anseriformes', name='KF971981_W_China.Central_Anseriformes', description='KF971981_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971989_W_China.Central_Anseriformes', name='KF971989_W_China.Central_Anseriformes', description='KF971989_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF971997_W_China.Central_Anseriformes', name='KF971997_W_China.Central_Anseriformes', description='KF971997_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTESNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KJ419953_D_E.Asia.E.China_Galliformes', name='KJ419953_D_E.Asia.E.China_Galliformes', description='KJ419953_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX456181_D_Middle.East_Galliformes', name='JX456181_D_Middle.East_Galliformes', description='JX456181_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLIIILLLVATSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC757824_D_S.Asia_Galliformes', name='KC757824_D_S.Asia_Galliformes', description='KC757824_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METITLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTD...---', SingleLetterAlphabet()), id='KC758037_D_S.Asia_Galliformes', name='KC758037_D_S.Asia_Galliformes', description='KC758037_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157526_W_N.Amer_Anseriformes', name='CY157526_W_N.Amer_Anseriformes', description='CY157526_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF714775_D_China.Central_Galliformes', name='KF714775_D_China.Central_Galliformes', description='KF714775_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLPTE...---', SingleLetterAlphabet()), id='JX294920_D_Middle.East_Galliformes', name='JX294920_D_Middle.East_Galliformes', description='JX294920_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLPTE...---', SingleLetterAlphabet()), id='JX294921_D_Middle.East_Galliformes', name='JX294921_D_Middle.East_Galliformes', description='JX294921_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTSSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF998208_D_Middle.East_Galliformes', name='KF998208_D_Middle.East_Galliformes', description='KF998208_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972005_W_China.Central_Anseriformes', name='KF972005_W_China.Central_Anseriformes', description='KF972005_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972013_W_China.Central_Anseriformes', name='KF972013_W_China.Central_Anseriformes', description='KF972013_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972021_W_China.Central_Anseriformes', name='KF972021_W_China.Central_Anseriformes', description='KF972021_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLXENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972029_W_China.Central_Anseriformes', name='KF972029_W_China.Central_Anseriformes', description='KF972029_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972037_W_China.Central_Anseriformes', name='KF972037_W_China.Central_Anseriformes', description='KF972037_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972045_W_China.Central_Anseriformes', name='KF972045_W_China.Central_Anseriformes', description='KF972045_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972053_W_China.Central_Anseriformes', name='KF972053_W_China.Central_Anseriformes', description='KF972053_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972061_W_China.Central_Anseriformes', name='KF972061_W_China.Central_Anseriformes', description='KF972061_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972069_W_China.Central_Anseriformes', name='KF972069_W_China.Central_Anseriformes', description='KF972069_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLMENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972077_W_China.Central_Anseriformes', name='KF972077_W_China.Central_Anseriformes', description='KF972077_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972085_W_China.Central_Anseriformes', name='KF972085_W_China.Central_Anseriformes', description='KF972085_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972093_W_China.Central_Anseriformes', name='KF972093_W_China.Central_Anseriformes', description='KF972093_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972101_W_China.Central_Anseriformes', name='KF972101_W_China.Central_Anseriformes', description='KF972101_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972109_W_China.Central_Anseriformes', name='KF972109_W_China.Central_Anseriformes', description='KF972109_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITTLIAILLMVTASNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KF972117_W_China.Central_Anseriformes', name='KF972117_W_China.Central_Anseriformes', description='KF972117_W_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLPTE...---', SingleLetterAlphabet()), id='JX294922_D_Middle.East_Galliformes', name='JX294922_D_Middle.East_Galliformes', description='JX294922_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX912984_D_Middle.East_Galliformes', name='JX912984_D_Middle.East_Galliformes', description='JX912984_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVCNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC920697_D_E.Asia.E.China_Galliformes', name='KC920697_D_E.Asia.E.China_Galliformes', description='KC920697_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF715244_D_China.West_Galliformes', name='KF715244_D_China.West_Galliformes', description='KF715244_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX912990_D_Middle.East_Galliformes', name='JX912990_D_Middle.East_Galliformes', description='JX912990_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258174_D_Middle.East_Galliformes', name='KF258174_D_Middle.East_Galliformes', description='KF258174_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADNICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881394_D_Middle.East_Galliformes', name='KF881394_D_Middle.East_Galliformes', description='KF881394_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF998210_D_Middle.East_Galliformes', name='KF998210_D_Middle.East_Galliformes', description='KF998210_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF998211_D_Middle.East_Galliformes', name='KF998211_D_Middle.East_Galliformes', description='KF998211_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC920696_D_E.Asia.E.China_Galliformes', name='KC920696_D_E.Asia.E.China_Galliformes', description='KC920696_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881475_D_Middle.East_Galliformes', name='KF881475_D_Middle.East_Galliformes', description='KF881475_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881732_D_Middle.East_Galliformes', name='KF881732_D_Middle.East_Galliformes', description='KF881732_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF998214_D_Middle.East_Galliformes', name='KF998214_D_Middle.East_Galliformes', description='KF998214_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLVVTGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259143_D_China.Central_Galliformes', name='KF259143_D_China.Central_Galliformes', description='KF259143_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259144_D_China.Central_Galliformes', name='KF259144_D_China.Central_Galliformes', description='KF259144_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259147_D_China.Central_Galliformes', name='KF259147_D_China.Central_Galliformes', description='KF259147_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTG...---', SingleLetterAlphabet()), id='KF259148_D_China.Central_Galliformes', name='KF259148_D_China.Central_Galliformes', description='KF259148_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLVITGNNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259156_D_China.Central_Galliformes', name='KF259156_D_China.Central_Galliformes', description='KF259156_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVTIITILLVITRSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259157_D_China.Central_Galliformes', name='KF259157_D_China.Central_Galliformes', description='KF259157_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVCNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC920691_D_E.Asia.E.China_Galliformes', name='KC920691_D_E.Asia.E.China_Galliformes', description='KC920691_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATILITILLTVATSSADKICIGYQSTNSTETVDTLIETNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY157534_W_N.Amer_Anseriformes', name='CY157534_W_N.Amer_Anseriformes', description='CY157534_W_N.Amer_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC879302_D_E.Asia.E.China_Galliformes', name='KC879302_D_E.Asia.E.China_Galliformes', description='KC879302_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLAVAASNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC767259_D_China.West_Galliformes', name='KC767259_D_China.West_Galliformes', description='KC767259_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLLVTVSNADKICIGYQSTNSTETVDTLTENDVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC879299_D_E.Asia.E.China_Galliformes', name='KC879299_D_E.Asia.E.China_Galliformes', description='KC879299_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLLVTVSNADKICIGYQSTNSTETVDTLTENDVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC879300_D_China.Central_Galliformes', name='KC879300_D_China.Central_Galliformes', description='KC879300_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF638575_D_China.West_Galliformes', name='KF638575_D_China.West_Galliformes', description='KF638575_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMIVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258186_D_Middle.East_Galliformes', name='KF258186_D_Middle.East_Galliformes', description='KF258186_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258191_D_Middle.East_Galliformes', name='KF258191_D_Middle.East_Galliformes', description='KF258191_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881640_D_Middle.East_Galliformes', name='KF881640_D_Middle.East_Galliformes', description='KF881640_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF638574_D_China.Central_Galliformes', name='KF638574_D_China.Central_Galliformes', description='KF638574_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258183_D_Middle.East_Galliformes', name='KF258183_D_Middle.East_Galliformes', description='KF258183_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258184_D_Middle.East_Galliformes', name='KF258184_D_Middle.East_Galliformes', description='KF258184_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF258190_D_Middle.East_Galliformes', name='KF258190_D_Middle.East_Galliformes', description='KF258190_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881378_D_Middle.East_Galliformes', name='KF881378_D_Middle.East_Galliformes', description='KF881378_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MRIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881459_D_Middle.East_Galliformes', name='KF881459_D_Middle.East_Galliformes', description='KF881459_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGIIPLMTVLLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881553_D_Middle.East_Galliformes', name='KF881553_D_Middle.East_Galliformes', description='KF881553_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGIIPLMTILLLVTTNNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF881370_D_Middle.East_Galliformes', name='KF881370_D_Middle.East_Galliformes', description='KF881370_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLAITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB836739_D_SE.Asia_Galliformes', name='AB836739_D_SE.Asia_Galliformes', description='AB836739_D_SE.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEALSLITTLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KJ419949_D_E.Asia.E.China_Galliformes', name='KJ419949_D_E.Asia.E.China_Galliformes', description='KJ419949_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLAITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB841272_D_SE.Asia_Anseriformes', name='AB841272_D_SE.Asia_Anseriformes', description='AB841272_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259159_D_E.Asia.E.China_Galliformes', name='KF259159_D_E.Asia.E.China_Galliformes', description='KF259159_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259160_D_E.Asia.E.China_Galliformes', name='KF259160_D_E.Asia.E.China_Galliformes', description='KF259160_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259166_D_E.Asia.E.China_Galliformes', name='KF259166_D_E.Asia.E.China_Galliformes', description='KF259166_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHARELLHTE...---', SingleLetterAlphabet()), id='KF259169_D_E.Asia.E.China_Galliformes', name='KF259169_D_E.Asia.E.China_Galliformes', description='KF259169_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHARELLHTE...---', SingleLetterAlphabet()), id='KF259171_D_E.Asia.E.China_Galliformes', name='KF259171_D_E.Asia.E.China_Galliformes', description='KF259171_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259184_D_E.Asia.E.China_Galliformes', name='KF259184_D_E.Asia.E.China_Galliformes', description='KF259184_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF259186_D_E.Asia.E.China_Galliformes', name='KF259186_D_E.Asia.E.China_Galliformes', description='KF259186_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF297299_D_E.Asia.E.China_Galliformes', name='KF297299_D_E.Asia.E.China_Galliformes', description='KF297299_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX465626_D_Middle.East_Galliformes', name='JX465626_D_Middle.East_Galliformes', description='JX465626_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM773438_D_E.Asia.E.China_Galliformes', name='HM773438_D_E.Asia.E.China_Galliformes', description='HM773438_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTASNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190124_D_China.Central_Galliformes', name='FJ190124_D_China.Central_Galliformes', description='FJ190124_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLRTILLVVTASNADKICIAYQSTNSTETVDTLTETNVPVTHATELLHTE...---', SingleLetterAlphabet()), id='KF313567_D_E.Asia.E.China_Galliformes', name='KF313567_D_E.Asia.E.China_Galliformes', description='KF313567_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATSLITILLLVTTSNADKICIGYQSTNSTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190129_D_E.Asia.E.China_Galliformes', name='FJ190129_D_E.Asia.E.China_Galliformes', description='FJ190129_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190150_D_China.West_Galliformes', name='FJ190150_D_China.West_Galliformes', description='FJ190150_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190123_D_China.Central_Galliformes', name='FJ190123_D_China.Central_Galliformes', description='FJ190123_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTASNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190128_D_E.Asia.E.China_Galliformes', name='FJ190128_D_E.Asia.E.China_Galliformes', description='FJ190128_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ710462_D_E.Asia.E.China_Galliformes', name='JQ710462_D_E.Asia.E.China_Galliformes', description='JQ710462_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEATSLITILLLVTTSNADKICIGYQSTNSTETVDTLAENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ190117_D_E.Asia.E.China_Galliformes', name='FJ190117_D_E.Asia.E.China_Galliformes', description='FJ190117_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIGHQSTNSTETVNTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU665422_D_S.Asia_Galliformes', name='EU665422_D_S.Asia_Galliformes', description='EU665422_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLLVTASNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF688983_D_E.Asia.E.China_Galliformes', name='KF688983_D_E.Asia.E.China_Galliformes', description='KF688983_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MDVVSLITIPLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF313559_D_E.Asia.E.China_Galliformes', name='KF313559_D_E.Asia.E.China_Galliformes', description='KF313559_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIIILLVVTTSNADKICIVHQSTNSTETVNTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='EU665423_D_S.Asia_Galliformes', name='EU665423_D_S.Asia_Galliformes', description='EU665423_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVASLITVLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM773435_D_E.Asia.E.China_Galliformes', name='HM773435_D_E.Asia.E.China_Galliformes', description='HM773435_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='HM136574_W_Europe_Anseriformes', name='HM136574_W_Europe_Anseriformes', description='HM136574_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITVLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM773436_D_E.Asia.E.China_Galliformes', name='HM773436_D_E.Asia.E.China_Galliformes', description='HM773436_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVLLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ710463_D_E.Asia.E.China_Galliformes', name='JQ710463_D_E.Asia.E.China_Galliformes', description='JQ710463_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLITILLSVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC986294_D_S.Asia_Galliformes', name='KC986294_D_S.Asia_Galliformes', description='KC986294_D_S.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLIATASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLQTE...---', SingleLetterAlphabet()), id='AB753177_D_SE.Asia_Galliformes', name='AB753177_D_SE.Asia_Galliformes', description='AB753177_D_SE.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ231866_D_E.Asia.E.China_Galliformes', name='FJ231866_D_E.Asia.E.China_Galliformes', description='FJ231866_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434561_D_China.West_Galliformes', name='FJ434561_D_China.West_Galliformes', description='FJ434561_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434562_D_China.West_Galliformes', name='FJ434562_D_China.West_Galliformes', description='FJ434562_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTMSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434572_D_E.Asia.E.China_Galliformes', name='FJ434572_D_E.Asia.E.China_Galliformes', description='FJ434572_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTMSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434585_D_China.Central_Galliformes', name='FJ434585_D_China.Central_Galliformes', description='FJ434585_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434586_D_E.Asia.E.China_Galliformes', name='FJ434586_D_E.Asia.E.China_Galliformes', description='FJ434586_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTTSNADKICIGHQSTNSTETVDTLAETNIPVTHAKELLHTE...VYN', SingleLetterAlphabet()), id='GU071977_D_Middle.East_Galliformes', name='GU071977_D_Middle.East_Galliformes', description='GU071977_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKTISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='GU071980_D_Middle.East_Galliformes', name='GU071980_D_Middle.East_Galliformes', description='GU071980_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434563_D_China.West_Galliformes', name='FJ434563_D_China.West_Galliformes', description='FJ434563_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434564_D_China.West_Galliformes', name='FJ434564_D_China.West_Galliformes', description='FJ434564_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HQ326722_D_E.Asia.E.China_Galliformes', name='HQ326722_D_E.Asia.E.China_Galliformes', description='HQ326722_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ434582_D_E.Asia.E.China_Galliformes', name='FJ434582_D_E.Asia.E.China_Galliformes', description='FJ434582_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF313561_D_China.Central_Galliformes', name='KF313561_D_China.Central_Galliformes', description='KF313561_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='FJ794818_D_Middle.East_Galliformes', name='FJ794818_D_Middle.East_Galliformes', description='FJ794818_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ973661_D_Middle.East_Galliformes', name='JQ973661_D_Middle.East_Galliformes', description='JQ973661_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGASNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HQ221678_D_E.Asia.E.China_Galliformes', name='HQ221678_D_E.Asia.E.China_Galliformes', description='HQ221678_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTK...---', SingleLetterAlphabet()), id='HQ221679_D_E.Asia.E.China_Galliformes', name='HQ221679_D_E.Asia.E.China_Galliformes', description='HQ221679_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='HM773434_D_E.Asia.E.China_Galliformes', name='HM773434_D_E.Asia.E.China_Galliformes', description='HM773434_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGIISLMTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254940_D_Middle.East_Galliformes', name='JQ254940_D_Middle.East_Galliformes', description='JQ254940_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MKSIVLIAILLVATTSNADKICIGYQSTNSTETVDTLIESNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='AB545593_D_SE.Asia_Anseriformes', name='AB545593_D_SE.Asia_Anseriformes', description='AB545593_D_SE.Asia_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVIALIAILVVTGTSNADKICIGYQSTNSTETVDTLVETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN852803_D_E.Asia.E.China_Galliformes', name='JN852803_D_E.Asia.E.China_Galliformes', description='JN852803_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MGIISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254937_D_Middle.East_Galliformes', name='JQ254937_D_Middle.East_Galliformes', description='JQ254937_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ419718_D_Middle.East_Galliformes', name='JQ419718_D_Middle.East_Galliformes', description='JQ419718_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTMSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='CY080415_W_Europe_Anseriformes', name='CY080415_W_Europe_Anseriformes', description='CY080415_W_Europe_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITILLIATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB753192_D_SE.Asia_Galliformes', name='AB753192_D_SE.Asia_Galliformes', description='AB753192_D_SE.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVINADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AB753213_D_SE.Asia_Galliformes', name='AB753213_D_SE.Asia_Galliformes', description='AB753213_D_SE.Asia_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIPLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ419722_D_Middle.East_Galliformes', name='JQ419722_D_Middle.East_Galliformes', description='JQ419722_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METTSLITILLVVTTSNADKICIGHQSTNSTETVDTLTETNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ419723_D_Middle.East_Galliformes', name='JQ419723_D_Middle.East_Galliformes', description='JQ419723_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLIATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN683644_D_E.Asia.E.China_Galliformes', name='JN683644_D_E.Asia.E.China_Galliformes', description='JN683644_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMAILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN646748_D_Middle.East_Galliformes', name='JN646748_D_Middle.East_Galliformes', description='JN646748_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN683647_D_E.Asia.E.China_Galliformes', name='JN683647_D_E.Asia.E.China_Galliformes', description='JN683647_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803952_D_E.Asia.E.China_Galliformes', name='JN803952_D_E.Asia.E.China_Galliformes', description='JN803952_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803960_D_E.Asia.E.China_Galliformes', name='JN803960_D_E.Asia.E.China_Galliformes', description='JN803960_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803964_D_E.Asia.E.China_Galliformes', name='JN803964_D_E.Asia.E.China_Galliformes', description='JN803964_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803976_D_China.Central_Galliformes', name='JN803976_D_China.Central_Galliformes', description='JN803976_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803993_D_China.Central_Anseriformes', name='JN803993_D_China.Central_Anseriformes', description='JN803993_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803994_D_China.Central_Anseriformes', name='JN803994_D_China.Central_Anseriformes', description='JN803994_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNAHKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN803999_D_China.Central_Anseriformes', name='JN803999_D_China.Central_Anseriformes', description='JN803999_D_China.Central_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715003_D_E.Asia.E.China_Galliformes', name='JF715003_D_E.Asia.E.China_Galliformes', description='JF715003_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY093088_D_Middle.East_Galliformes', name='CY093088_D_Middle.East_Galliformes', description='CY093088_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY093096_D_Middle.East_Galliformes', name='CY093096_D_Middle.East_Galliformes', description='CY093096_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF714997_D_China.Central_Galliformes', name='JF714997_D_China.Central_Galliformes', description='JF714997_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF714998_D_China.Central_Galliformes', name='JF714998_D_China.Central_Galliformes', description='JF714998_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTVLLVVTTSNADKICIGHQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254942_D_Middle.East_Galliformes', name='JQ254942_D_Middle.East_Galliformes', description='JQ254942_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254945_D_Middle.East_Galliformes', name='JQ254945_D_Middle.East_Galliformes', description='JQ254945_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254948_D_Middle.East_Galliformes', name='JQ254948_D_Middle.East_Galliformes', description='JQ254948_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVITTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254952_D_Middle.East_Galliformes', name='JQ254952_D_Middle.East_Galliformes', description='JQ254952_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTVLLVVTTSNADKICIGHQSTNSTETVDTLTENNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ254954_D_Middle.East_Galliformes', name='JQ254954_D_Middle.East_Galliformes', description='JQ254954_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METIALIAILLLTTACNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='JQ609664_D_Europe_Galliformes', name='JQ609664_D_Europe_Galliformes', description='JQ609664_D_Europe_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITTLLAITTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715033_D_China.Central_Galliformes', name='JF715033_D_China.Central_Galliformes', description='JF715033_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITTLLAVTTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715036_D_E.Asia.E.China_Galliformes', name='JF715036_D_E.Asia.E.China_Galliformes', description='JF715036_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITGSNADKIRIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715044_D_China.Central_Galliformes', name='JF715044_D_China.Central_Galliformes', description='JF715044_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLLITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715046_D_China.Central_Galliformes', name='JF715046_D_China.Central_Galliformes', description='JF715046_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715048_D_China.Central_Galliformes', name='JF715048_D_China.Central_Galliformes', description='JF715048_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLLITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715051_D_China.Central_Galliformes', name='JF715051_D_China.Central_Galliformes', description='JF715051_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JF715018_D_E.Asia.E.China_Galliformes', name='JF715018_D_E.Asia.E.China_Galliformes', description='JF715018_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX448760_D_E.Asia.E.China_Galliformes', name='JX448760_D_E.Asia.E.China_Galliformes', description='JX448760_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITTLLVITVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804504_D_E.Asia.E.China_Galliformes', name='JN804504_D_E.Asia.E.China_Galliformes', description='JN804504_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804513_D_China.West_Galliformes', name='JN804513_D_China.West_Galliformes', description='JN804513_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804515_D_China.West_Galliformes', name='JN804515_D_China.West_Galliformes', description='JN804515_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804520_D_China.West_Galliformes', name='JN804520_D_China.West_Galliformes', description='JN804520_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804521_D_China.West_Galliformes', name='JN804521_D_China.West_Galliformes', description='JN804521_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804523_D_China.West_Galliformes', name='JN804523_D_China.West_Galliformes', description='JN804523_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804525_D_China.West_Galliformes', name='JN804525_D_China.West_Galliformes', description='JN804525_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVATLITILLVITGNNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804526_D_China.West_Galliformes', name='JN804526_D_China.West_Galliformes', description='JN804526_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVATLITILLVITGNNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804527_D_China.West_Galliformes', name='JN804527_D_China.West_Galliformes', description='JN804527_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVLLMTTLLAITTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804534_D_China.Central_Galliformes', name='JN804534_D_China.Central_Galliformes', description='JN804534_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804540_D_China.Central_Galliformes', name='JN804540_D_China.Central_Galliformes', description='JN804540_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLITMLLVATVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804542_D_China.West_Galliformes', name='JN804542_D_China.West_Galliformes', description='JN804542_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVLTVSNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804543_D_China.West_Galliformes', name='JN804543_D_China.West_Galliformes', description='JN804543_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVLTVSNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804544_D_China.West_Galliformes', name='JN804544_D_China.West_Galliformes', description='JN804544_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVLTVSNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804545_D_China.West_Galliformes', name='JN804545_D_China.West_Galliformes', description='JN804545_D_China.West_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVLTVSNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804547_D_China.West_Anseriformes', name='JN804547_D_China.West_Anseriformes', description='JN804547_D_China.West_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAATIITILLAITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JN804557_D_China.Central_Galliformes', name='JN804557_D_China.Central_Galliformes', description='JN804557_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITPLMTILLLVTTSNADKICIGHQSTNSTETVDTLAETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ906555_D_Middle.East_Galliformes', name='JQ906555_D_Middle.East_Galliformes', description='JQ906555_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIALIAILLVTTTSNADKICIGYQSTNSTETVDTLIENNVPVTHTKELLHTE...---', SingleLetterAlphabet()), id='KC162234_W_E.Asia.E.China_Anseriformes', name='KC162234_W_E.Asia.E.China_Anseriformes', description='KC162234_W_E.Asia.E.China_Anseriformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY110927_D_Middle.East_Galliformes', name='CY110927_D_Middle.East_Galliformes', description='CY110927_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='CY110928_D_Middle.East_Galliformes', name='CY110928_D_Middle.East_Galliformes', description='CY110928_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVITGSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ770133_D_China.Central_Galliformes', name='JQ770133_D_China.Central_Galliformes', description='JQ770133_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JQ973658_D_Middle.East_Galliformes', name='JQ973658_D_Middle.East_Galliformes', description='JQ973658_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEITSLMTILLVITTSSADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ973660_D_Middle.East_Galliformes', name='JQ973660_D_Middle.East_Galliformes', description='JQ973660_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JQ973652_D_Middle.East_Galliformes', name='JQ973652_D_Middle.East_Galliformes', description='JQ973652_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEPISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='JQ973653_D_Middle.East_Galliformes', name='JQ973653_D_Middle.East_Galliformes', description='JQ973653_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTVLLVVTTSNADKICIGHQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ973654_D_Middle.East_Galliformes', name='JQ973654_D_Middle.East_Galliformes', description='JQ973654_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVATVSYADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC417046_D_E.Asia.E.China_Galliformes', name='KC417046_D_E.Asia.E.China_Galliformes', description='KC417046_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLTTILLLVTTSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ906557_D_Middle.East_Galliformes', name='JQ906557_D_Middle.East_Galliformes', description='JQ906557_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIIPLMTVLLLVTSSNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JQ906558_D_Middle.East_Galliformes', name='JQ906558_D_Middle.East_Galliformes', description='JQ906558_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METASLMTILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KC817014_D_China.Central_Galliformes', name='KC817014_D_China.Central_Galliformes', description='KC817014_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITTLLAVTTSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX448765_D_E.Asia.E.China_Galliformes', name='JX448765_D_E.Asia.E.China_Galliformes', description='JX448765_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEVVSLITILLVVTVCNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='JX846585_D_China.Central_Galliformes', name='JX846585_D_China.Central_Galliformes', description='JX846585_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METVSLITILLVATISNADKICIGYQSTNSTETVDTLTENNVPVTHVKELLHTE...---', SingleLetterAlphabet()), id='KC951122_D_China.Central_Galliformes', name='KC951122_D_China.Central_Galliformes', description='KC951122_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEIISLMTVLLVVTTSNADKICIGHQSTNSTETVDTLTENNIPVTHAKELLHTE...---', SingleLetterAlphabet()), id='KF918709_D_Middle.East_Galliformes', name='KF918709_D_Middle.East_Galliformes', description='KF918709_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('MEAISLMTILLVVTTSNADKICIGHQSTNSTETVDTLTETNVPVTQAKELLHTE...---', SingleLetterAlphabet()), id='KF918708_D_Middle.East_Galliformes', name='KF918708_D_Middle.East_Galliformes', description='KF918708_D_Middle.East_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGHQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF156378_D_China.Central_Galliformes', name='AF156378_D_China.Central_Galliformes', description='AF156378_D_China.Central_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLITILLVVTASNADKICIGYQSTNSTETVDTLTETNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF156380_D_E.Asia.E.China_Galliformes', name='AF156380_D_E.Asia.E.China_Galliformes', description='AF156380_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[]),
SeqRecord(seq=Seq('METISLIAILLVVTVSNADKICIGYQSTNSTETVDTLTENNVPVTHAKELLHTE...---', SingleLetterAlphabet()), id='AF461532_D_E.Asia.E.China_Galliformes', name='AF461532_D_E.Asia.E.China_Galliformes', description='AF461532_D_E.Asia.E.China_Galliformes <unknown description>', dbxrefs=[])]
In [9]:
df = pd.DataFrame(np.array(genes))
# Capture accession and wild or domestic status as an array.
labels_wd = []
labels_geo = []
labels_wd_geo = []
labels_species = []
labels_wd_species = []
labels_wd_geo_species = []
for sequence in genes:
if 'nan' in sequence.id:
pass
else:
sequence_id = sequence.id.split("_")
label_wd = sequence_id[1]
label_geo = sequence_id[2]
label_wd_geo = label_wd + '-' + label_geo
label_species = sequence_id[3]
label_wd_species = label_wd + "-" + label_species
label_wd_geo_species = label_wd + "_" + label_geo + "_" + label_species
labels_wd.append(label_wd)
labels_geo.append(label_geo)
labels_wd_geo.append(label_wd_geo)
labels_species.append(label_species)
labels_wd_species.append(label_wd_species)
labels_wd_geo_species.append(label_wd_geo_species)
# Remove any positions that do not contain any variation
for column in df.columns:
if len(np.unique(df[column].values)) == 1:
del df[column]
df
Out[9]:
0
1
2
3
4
5
6
7
8
9
...
556
557
558
559
560
561
562
563
564
565
0
M
E
T
K
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
1
M
E
T
T
T
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
2
M
E
T
I
A
P
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
3
M
E
I
T
T
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
4
M
E
I
T
T
L
V
A
I
L
...
N
I
C
I
-
-
-
-
-
-
5
M
E
I
T
T
L
V
A
I
L
...
N
I
C
I
-
-
-
-
-
-
6
M
E
I
T
T
L
V
A
I
L
...
N
I
C
I
-
-
-
-
-
-
7
M
E
I
T
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
8
M
E
T
I
S
L
I
T
I
L
...
N
-
-
-
-
-
-
-
-
-
9
M
E
I
I
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
10
M
E
I
I
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
11
M
E
T
R
T
L
I
A
A
L
...
N
I
C
I
-
-
-
-
-
-
12
M
E
T
T
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
13
M
E
I
I
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
14
M
E
A
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
15
M
E
A
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
16
M
E
A
T
A
I
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
17
M
E
Q
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
18
M
E
T
I
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
19
M
E
T
I
S
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
20
M
E
T
I
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
21
M
E
T
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
22
M
E
T
T
S
L
L
T
I
L
...
S
I
E
-
-
-
-
-
-
-
23
M
E
Q
V
S
L
I
T
I
L
...
N
I
C
-
-
-
-
-
-
-
24
M
E
T
I
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
25
M
E
T
I
S
L
I
T
I
I
...
N
I
C
I
-
-
-
-
-
-
26
M
E
T
R
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
27
M
E
T
I
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
28
M
E
T
I
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
29
M
E
T
R
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
547
M
E
T
V
L
L
M
T
T
L
...
N
I
-
-
-
-
-
-
-
-
548
M
E
T
V
S
L
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
549
M
E
T
A
S
L
I
T
M
L
...
N
I
-
-
-
-
-
-
-
-
550
M
E
T
V
S
L
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
551
M
E
T
V
S
L
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
552
M
E
T
V
S
L
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
553
M
E
T
V
S
L
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
554
M
E
A
A
T
I
I
T
I
L
...
N
I
-
-
-
-
-
-
-
-
555
M
E
I
T
P
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
556
M
E
I
I
A
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
557
M
E
I
I
P
L
T
T
I
L
...
N
I
C
I
-
-
-
-
-
-
558
M
E
I
I
P
L
T
T
I
L
...
N
I
C
I
-
-
-
-
-
-
559
M
E
V
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
560
M
E
I
I
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
561
M
E
I
T
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
562
M
E
T
I
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
563
M
E
P
I
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
564
M
E
I
I
S
L
M
T
V
L
...
N
I
C
I
-
-
-
-
-
-
565
M
E
V
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
566
M
E
I
I
P
L
T
T
I
L
...
-
-
-
-
-
-
-
-
-
-
567
M
E
I
I
P
L
M
T
V
L
...
-
-
-
-
-
-
-
-
-
-
568
M
E
T
A
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
569
M
E
V
V
S
L
I
T
T
L
...
N
I
C
I
-
-
-
-
-
-
570
M
E
V
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
571
M
E
T
V
S
L
I
T
I
L
...
N
I
C
I
-
-
-
-
-
-
572
M
E
I
I
S
L
M
T
V
L
...
N
I
C
I
-
-
-
-
-
-
573
M
E
A
I
S
L
M
T
I
L
...
N
I
C
I
-
-
-
-
-
-
574
M
E
T
I
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
575
M
E
T
I
S
L
I
T
I
L
...
-
-
-
-
-
-
-
-
-
-
576
M
E
T
I
S
L
I
A
I
L
...
N
I
C
I
-
-
-
-
-
-
577 rows × 455 columns
In [11]:
print(len(df))
print(len(labels_species))
np.unique(labels_wd_species)
np.unique(labels_wd_geo_species)
577
577
Out[11]:
array(['D_China.Central_Anseriformes', 'D_China.Central_Galliformes',
'D_China.West_Anseriformes', 'D_China.West_Galliformes',
'D_E.Asia.E.China_Anseriformes', 'D_E.Asia.E.China_Galliformes',
'D_Europe_Galliformes', 'D_Middle.East_Anseriformes',
'D_Middle.East_Galliformes', 'D_S.Asia_Anseriformes',
'D_S.Asia_Galliformes', 'D_SE.Asia_Anseriformes',
'D_SE.Asia_Galliformes', 'W_China.Central_Anseriformes',
'W_E.Asia.E.China_Anseriformes', 'W_Europe_Anseriformes',
'W_Europe_Charadriiformes', 'W_Middle.East_Anseriformes',
'W_Middle.East_Charadriiformes', 'W_N.Amer_Anseriformes',
'W_N.Amer_Charadriiformes'],
dtype='|S29')
In [21]:
from random import shuffle
# Encode the amino acids with categorial labels 1-20
le = LabelEncoder()
amino_acid_code = (list('ABCDEFGHIJKLMNPQRSTVWXY-'))
shuffle(amino_acid_code)
print(len(amino_acid_code))
le.fit(amino_acid_code)
a_encoded = le.transform(amino_acid_code)
# a_encoded
# Replace amino acids with integer numbers.
encode_dict = {letter:int(encode) for letter, encode in zip(amino_acid_code, a_encoded)}
# encode_dict
encoded_df = df.replace(to_replace=encode_dict.keys(), value=encode_dict.values())
encoded_df
24
Out[21]:
0
1
2
3
4
5
6
7
8
9
...
556
557
558
559
560
561
562
563
564
565
0
13
5
19
11
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
1
13
5
19
19
19
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
2
13
5
19
9
1
15
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
3
13
5
9
19
19
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
4
13
5
9
19
19
12
20
1
9
12
...
14
9
3
9
0
0
0
0
0
0
5
13
5
9
19
19
12
20
1
9
12
...
14
9
3
9
0
0
0
0
0
0
6
13
5
9
19
19
12
20
1
9
12
...
14
9
3
9
0
0
0
0
0
0
7
13
5
9
19
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
8
13
5
19
9
18
12
9
19
9
12
...
14
0
0
0
0
0
0
0
0
0
9
13
5
9
9
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
10
13
5
9
9
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
11
13
5
19
17
19
12
9
1
1
12
...
14
9
3
9
0
0
0
0
0
0
12
13
5
19
19
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
13
13
5
9
9
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
14
13
5
1
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
15
13
5
1
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
16
13
5
1
19
1
9
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
17
13
5
16
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
18
13
5
19
9
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
19
13
5
19
9
18
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
20
13
5
19
9
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
21
13
5
19
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
22
13
5
19
19
18
12
12
19
9
12
...
18
9
5
0
0
0
0
0
0
0
23
13
5
16
20
18
12
9
19
9
12
...
14
9
3
0
0
0
0
0
0
0
24
13
5
19
9
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
25
13
5
19
9
18
12
9
19
9
9
...
14
9
3
9
0
0
0
0
0
0
26
13
5
19
17
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
27
13
5
19
9
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
28
13
5
19
9
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
29
13
5
19
17
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
...
547
13
5
19
20
12
12
13
19
19
12
...
14
9
0
0
0
0
0
0
0
0
548
13
5
19
20
18
12
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
549
13
5
19
1
18
12
9
19
13
12
...
14
9
0
0
0
0
0
0
0
0
550
13
5
19
20
18
12
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
551
13
5
19
20
18
12
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
552
13
5
19
20
18
12
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
553
13
5
19
20
18
12
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
554
13
5
1
1
19
9
9
19
9
12
...
14
9
0
0
0
0
0
0
0
0
555
13
5
9
19
15
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
556
13
5
9
9
1
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
557
13
5
9
9
15
12
19
19
9
12
...
14
9
3
9
0
0
0
0
0
0
558
13
5
9
9
15
12
19
19
9
12
...
14
9
3
9
0
0
0
0
0
0
559
13
5
20
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
560
13
5
9
9
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
561
13
5
9
19
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
562
13
5
19
9
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
563
13
5
15
9
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
564
13
5
9
9
18
12
13
19
20
12
...
14
9
3
9
0
0
0
0
0
0
565
13
5
20
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
566
13
5
9
9
15
12
19
19
9
12
...
0
0
0
0
0
0
0
0
0
0
567
13
5
9
9
15
12
13
19
20
12
...
0
0
0
0
0
0
0
0
0
0
568
13
5
19
1
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
569
13
5
20
20
18
12
9
19
19
12
...
14
9
3
9
0
0
0
0
0
0
570
13
5
20
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
571
13
5
19
20
18
12
9
19
9
12
...
14
9
3
9
0
0
0
0
0
0
572
13
5
9
9
18
12
13
19
20
12
...
14
9
3
9
0
0
0
0
0
0
573
13
5
1
9
18
12
13
19
9
12
...
14
9
3
9
0
0
0
0
0
0
574
13
5
19
9
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
575
13
5
19
9
18
12
9
19
9
12
...
0
0
0
0
0
0
0
0
0
0
576
13
5
19
9
18
12
9
1
9
12
...
14
9
3
9
0
0
0
0
0
0
577 rows × 455 columns
In [22]:
#
# # Run 1000 runs of the Random Forest classifier, and average the feature importances.
# feature_importance_dict = {pos:[] for pos in encoded_df.columns}
# for i in range(1000):
# rf = RandomForestClassifier()
# rf.fit_transform(encoded_df, labels_wd)
# for pos, importance in zip(encoded_df.columns, rf.feature_importances_):
# feature_importance_dict[pos].append(importance)
# # Get the mean for each feature_importance
# mean_importances_wd = {pos:None for key in feature_importance_dict.keys()}
# for pos, importances in feature_importance_dict.items():
# mean_importances_wd[pos] = np.mean(importances)
In [23]:
def run_rfa(data, labels, n_runs, scatter_color, analysis_name, gene_name):
"""
This function runs the Random Forest Algorithm on an alignment.
Inputs:
- data: a pandas DataFrame with the amino acids aligned and encoded as integers.
- labels: a list of labels
- n_runs: the number of times the Random Forests are to be run.
- scatter_color: the color of the scatterplot dots.
- analysis_name: a string handle labelling the analysis.
- gene_name: the name of the influenza gene.
Outputs:
- SAVE TO DISK:
- A scatter plot of Relative Feature Importance vs. Position in Alignment.
- A CSV file of the relative feature importances.
- RETURN: mean_importances: a dictionary of positions and the mean feature_importances.
"""
feature_importances_dict = {pos:[] for pos in encoded_df.columns}
permuted_importances = []
labels_copy = deepcopy(labels)
for i in range(n_runs):
if i % 20 == 0:
print("Currently at iteration {0}.".format(i))
# Fit-transform based on ground truth labels.
rf = RandomForestClassifier()
rf.fit_transform(data, labels)
for pos, importance in zip(data.columns, rf.feature_importances_):
feature_importances_dict[pos].append(importance)
# Fit-predict on shuffled labels.
shuffle(labels_copy)
rf_shuffled = RandomForestClassifier()
rf_shuffled.fit_transform(data, labels_copy)
for importance in rf_shuffled.feature_importances_:
permuted_importances.append(importance)
# This is where the permutation test is performed.
mean_importances = {pos:None for key in feature_importances_dict.keys()}
threshold = mquantiles(permuted_importances, 0.95)[0]
print("Threshold Importance: {0}".format(threshold))
for pos, importances in feature_importances_dict.items():
if np.mean(importances) > threshold:
mean_importances[pos] = np.mean(importances)
# Generate scatterplot
plt.scatter(mean_importances.keys(), mean_importances.values(), color=scatter_color)
plt.title('{0} \n Positional Importances for {1} Gene'.format(analysis_name, gene_name))
plt.xlabel('Position in Amino Acid Alignment')
plt.ylabel('Relative Feature Importance')
plt.savefig('{0} {1} Positional Feature Importances.pdf'.format(analysis_name, gene_name))
# Generate CSV file of ranked importances
pos_importance = sorted(mean_importances.items(), key=lambda x:x[1])[::-1]
pos_by_importance = [pos for (pos, score) in pos_importance]
importances_df = pd.DataFrame(pos_importance)
importances_df.columns=['Position', 'Relative Importance']
importances_df.to_csv('{0} {1} Relative Importances.csv'.format(analysis_name, gene_name))
return pos_importance, importances_df
In [24]:
def group_proportions_piecharts(counter, pos, groups, analysis_type, figsize):
groups_letters = dict()
for group in list(set(groups)):
groups_letters[group] = [letter for (letter, state) in counter[pos].keys() if state == group]
letters = set([letter for (letter, state) in counter[pos].keys()])
group_proportions = dict()
for group in list(set(groups)):
group_proportions[group] = dict()
for letter in letters:
for group in group_proportions.keys():
if letter in groups_letters[group]:
group_proportions[group][letter] = counter[pos][(letter, group)]
if letter not in groups_letters[group]:
group_proportions[group][letter] = 0
numgroups = len(set(groups))
fig = plt.figure(figsize=figsize)
sorted_groups = sorted(groups, key=lambda x: (x.split('-')[1], x.split('-')[0]) if '-' in x else x)
for group in sorted_groups:
if len(letters) < 3:
bmap = brewer2mpl.get_map('Set3', 'qualitative', 3)
elif len(letters) > 12:
bmap = brewer2mpl.get_map('Set3', 'qualitative', 12)
else:
bmap = brewer2mpl.get_map('Set3', 'qualitative', len(letters))
colors = bmap.mpl_colors
num_cols = 2
num_rows = numgroups // num_cols + 1
position = sorted_groups.index(group) + 1
diversity = sdi(group_proportions[group])
ax = fig.add_subplot(num_rows, num_cols, position)
plt.pie(group_proportions[group].values(), colors=colors, radius=10)
plt.axis('equal')
plt.title('{0}, Pos {1}, \n n={2}, sdi={3}'.format(group, pos, sum(group_proportions[group].values()), round(diversity, 3)))
plt.legend(labels=letters, loc="center left", bbox_to_anchor=(1.0, 0.5), ncol=2)
plt.savefig('{0} {1} Position {2} Proportion of Amino Acids.pdf'.format(analysis_type, gene, pos), bbox_inches='tight')
plt.show()
In [25]:
def normalize_counts(counter):
# Custom function to normalize counts to a proportion from 0 to 1.0.
total = sum(counter.values())
if total != 0:
normalized_counter = {key:float(value/total) for key, value in counter.items()}
else:
normalized_counter = {key:1 for key, value in counter.items()}
return normalized_counter
In [26]:
def cumulative_importances(importances_df, analysis_name):
importances_df.cumsum()['Relative Importance'].plot()
plt.xlabel('Rank Order')
plt.ylabel('Cumulative Importance')
plt.title('{0} Cumulative Importances of\nRanked Amino Acid Positions'.format(analysis_name))
plt.savefig('{0} Cumulative Importances.pdf'.format(analysis_name))
In [27]:
pos_importance_ecotype, importances_ecotype = run_rfa(data=encoded_df,
labels=labels_wd,
n_runs=1000,
scatter_color='r',
analysis_name='Ecotype',
gene_name='HA')
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.00895522707609
In [28]:
cumulative_importances(importances_ecotype, 'Ecotype')
In [29]:
counts_wd = dict()
for pos in df.columns:
counts_wd[pos] = Counter(zip(df[pos].values, labels_wd))
for pos, importance in pos_importance_ecotype[0:10]:
group_proportions_piecharts(counts_wd, pos, list(set(labels_wd)), 'Ecotype', figsize=(6, 6))
In [30]:
pos_importance_geo, importances_geo = run_rfa(data=encoded_df, labels=labels_geo, n_runs=1000, scatter_color='r', analysis_name='Geography', gene_name='HA')
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.00791429997177
In [31]:
cumulative_importances(importances_geo, 'Geography')
In [32]:
counts_geo = dict()
for pos in df.columns:
counts_geo[pos] = Counter(zip(df[pos].values, labels_geo))
for pos, importance in pos_importance_geo[0:10]:
group_proportions_piecharts(counts_geo, pos, list(set(labels_geo)), 'Geography', figsize=(6, 17))
In [33]:
pos_importance_species, importances_species = run_rfa(data=encoded_df, labels=labels_species, n_runs=1000, scatter_color='r', analysis_name='Bird Order', gene_name='HA')
counts_species = dict()
for pos in df.columns:
counts_species[pos] = Counter(zip(df[pos].values, labels_species))
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.00850078905381
In [34]:
cumulative_importances(importances_species, 'Bird Order')
In [35]:
for pos, importance in pos_importance_species[0:10]:
group_proportions_piecharts(counts_species, pos, list(set(labels_species)), 'Bird Order', figsize=(6,6))
In [36]:
pos_importance_wd_species, importances_wd_species = run_rfa(data=encoded_df, labels=labels_wd_species, n_runs=1000, scatter_color='r', analysis_name='Ecotype and Bird Order', gene_name='HA')
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.00846683497447
In [37]:
cumulative_importances(importances_wd_species, 'Ecotype and Bird Order')
In [38]:
counts_wd_species = dict()
for pos in df.columns:
counts_wd_species[pos] = Counter(zip(df[pos].values, labels_wd_species))
for pos, importance in pos_importance_wd_species[0:10]:
group_proportions_piecharts(counts_wd_species, pos, list(set(labels_wd_species)), 'Ecotype and Bird Order', figsize=(6,10))
In [39]:
pos_importance_wd_geo, importances_wd_geo = run_rfa(data=encoded_df, labels=labels_wd_geo, n_runs=1000, scatter_color='r', analysis_name='Ecotype and Geography', gene_name='HA')
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.00789190492276
In [40]:
cumulative_importances(importances_wd_geo, 'Ecotype and Geography')
In [75]:
counts_wd_geo = dict()
for pos in df.columns:
counts_wd_geo[pos] = Counter(zip(df[pos].values, labels_wd_geo))
# For completeness, we add in the following label
missing_labels = ['W-China.West', 'W-SE.Asia', 'D-N.Amer', 'W-S.Asia']
for pos, importance in pos_importance_wd_geo[0:10]:
group_proportions_piecharts(counts_wd_geo, pos, set(labels_wd_geo), 'Ecotype and Geography',
figsize=(6, 30))
In [42]:
pos_importance_wd_geo_species, importances_wd_geo_species = run_rfa(data=encoded_df,
labels=labels_wd_geo_species,
n_runs=1000,
scatter_color='r',
analysis_name='Ecotype, Geography and Bird Order',
gene_name='HA')
Currently at iteration 0.
Currently at iteration 20.
Currently at iteration 40.
Currently at iteration 60.
Currently at iteration 80.
Currently at iteration 100.
Currently at iteration 120.
Currently at iteration 140.
Currently at iteration 160.
Currently at iteration 180.
Currently at iteration 200.
Currently at iteration 220.
Currently at iteration 240.
Currently at iteration 260.
Currently at iteration 280.
Currently at iteration 300.
Currently at iteration 320.
Currently at iteration 340.
Currently at iteration 360.
Currently at iteration 380.
Currently at iteration 400.
Currently at iteration 420.
Currently at iteration 440.
Currently at iteration 460.
Currently at iteration 480.
Currently at iteration 500.
Currently at iteration 520.
Currently at iteration 540.
Currently at iteration 560.
Currently at iteration 580.
Currently at iteration 600.
Currently at iteration 620.
Currently at iteration 640.
Currently at iteration 660.
Currently at iteration 680.
Currently at iteration 700.
Currently at iteration 720.
Currently at iteration 740.
Currently at iteration 760.
Currently at iteration 780.
Currently at iteration 800.
Currently at iteration 820.
Currently at iteration 840.
Currently at iteration 860.
Currently at iteration 880.
Currently at iteration 900.
Currently at iteration 920.
Currently at iteration 940.
Currently at iteration 960.
Currently at iteration 980.
Threshold Importance: 0.0078327763077
In [43]:
cumulative_importances(importances_wd_geo_species, 'Ecotype, Geography and Bird Order')
In [76]:
# set(labels_wd), set(labels_geo), set(labels_species)
# complete_labels = []
# for wd in set(labels_wd):
# for geo in set(labels_geo):
# for species in set(labels_species):
# complete_labels.append(wd + "_" + geo + "_" + species)
# complete_labels
In [73]:
counts_wd_geo_species = dict()
for pos in df.columns:
counts_wd_geo_species[pos] = Counter(zip(df[pos].values, labels_wd_geo_species))
for pos, importance in pos_importance_wd_geo_species[0:10]:
group_proportions_piecharts(counts_wd_geo_species, pos, set(labels_wd_geo_species), 'Ecotype, Geography and Bird Order',
figsize=(10, 55))
In [ ]:
Content source: ericmjl/H9N2
Similar notebooks: